blob: 9f847bd834fa68d4f85b06f5a40657eb385b3baf [file] [log] [blame]
Evan Chenga8e29892007-01-19 07:51:42 +00001//===-- ARMISelLowering.cpp - ARM DAG Lowering Implementation -------------===//
2//
3// The LLVM Compiler Infrastructure
4//
Chris Lattner4ee451d2007-12-29 20:36:04 +00005// This file is distributed under the University of Illinois Open Source
6// License. See LICENSE.TXT for details.
Evan Chenga8e29892007-01-19 07:51:42 +00007//
8//===----------------------------------------------------------------------===//
9//
10// This file defines the interfaces that ARM uses to lower LLVM code into a
11// selection DAG.
12//
13//===----------------------------------------------------------------------===//
14
15#include "ARM.h"
16#include "ARMAddressingModes.h"
17#include "ARMConstantPoolValue.h"
18#include "ARMISelLowering.h"
19#include "ARMMachineFunctionInfo.h"
20#include "ARMRegisterInfo.h"
21#include "ARMSubtarget.h"
22#include "ARMTargetMachine.h"
23#include "llvm/CallingConv.h"
24#include "llvm/Constants.h"
Bob Wilson1f595bb2009-04-17 19:07:39 +000025#include "llvm/Function.h"
Evan Cheng27707472007-03-16 08:43:56 +000026#include "llvm/Instruction.h"
Lauro Ramos Venancioe0cb36b2007-11-08 17:20:05 +000027#include "llvm/Intrinsics.h"
Chris Lattner84bc5422007-12-31 04:13:23 +000028#include "llvm/GlobalValue.h"
Bob Wilson1f595bb2009-04-17 19:07:39 +000029#include "llvm/CodeGen/CallingConvLower.h"
Evan Chenga8e29892007-01-19 07:51:42 +000030#include "llvm/CodeGen/MachineBasicBlock.h"
31#include "llvm/CodeGen/MachineFrameInfo.h"
32#include "llvm/CodeGen/MachineFunction.h"
33#include "llvm/CodeGen/MachineInstrBuilder.h"
Chris Lattner84bc5422007-12-31 04:13:23 +000034#include "llvm/CodeGen/MachineRegisterInfo.h"
Bob Wilson1f595bb2009-04-17 19:07:39 +000035#include "llvm/CodeGen/PseudoSourceValue.h"
Evan Chenga8e29892007-01-19 07:51:42 +000036#include "llvm/CodeGen/SelectionDAG.h"
Evan Chengb6ab2542007-01-31 08:40:13 +000037#include "llvm/Target/TargetOptions.h"
Evan Chenga8e29892007-01-19 07:51:42 +000038#include "llvm/ADT/VectorExtras.h"
Evan Chengb01fad62007-03-12 23:30:29 +000039#include "llvm/Support/MathExtras.h"
Evan Chenga8e29892007-01-19 07:51:42 +000040using namespace llvm;
41
Bob Wilsondee46d72009-04-17 20:35:10 +000042static bool CC_ARM_APCS_Custom_f64(unsigned &ValNo, MVT &ValVT, MVT &LocVT,
Bob Wilson1f595bb2009-04-17 19:07:39 +000043 CCValAssign::LocInfo &LocInfo,
44 ISD::ArgFlagsTy &ArgFlags,
45 CCState &State);
Bob Wilsondee46d72009-04-17 20:35:10 +000046static bool CC_ARM_AAPCS_Custom_f64(unsigned &ValNo, MVT &ValVT, MVT &LocVT,
Bob Wilson1f595bb2009-04-17 19:07:39 +000047 CCValAssign::LocInfo &LocInfo,
48 ISD::ArgFlagsTy &ArgFlags,
49 CCState &State);
Bob Wilsondee46d72009-04-17 20:35:10 +000050static bool RetCC_ARM_APCS_Custom_f64(unsigned &ValNo, MVT &ValVT, MVT &LocVT,
Bob Wilson1f595bb2009-04-17 19:07:39 +000051 CCValAssign::LocInfo &LocInfo,
52 ISD::ArgFlagsTy &ArgFlags,
53 CCState &State);
Bob Wilsondee46d72009-04-17 20:35:10 +000054static bool RetCC_ARM_AAPCS_Custom_f64(unsigned &ValNo, MVT &ValVT, MVT &LocVT,
Bob Wilson1f595bb2009-04-17 19:07:39 +000055 CCValAssign::LocInfo &LocInfo,
56 ISD::ArgFlagsTy &ArgFlags,
57 CCState &State);
58
Bob Wilson5bafff32009-06-22 23:27:02 +000059void ARMTargetLowering::addTypeForNEON(MVT VT, MVT PromotedLdStVT,
60 MVT PromotedBitwiseVT) {
61 if (VT != PromotedLdStVT) {
62 setOperationAction(ISD::LOAD, VT, Promote);
63 AddPromotedToType (ISD::LOAD, VT, PromotedLdStVT);
64
65 setOperationAction(ISD::STORE, VT, Promote);
66 AddPromotedToType (ISD::STORE, VT, PromotedLdStVT);
67 }
68
69 MVT ElemTy = VT.getVectorElementType();
70 if (ElemTy != MVT::i64 && ElemTy != MVT::f64)
71 setOperationAction(ISD::VSETCC, VT, Custom);
72 if (ElemTy == MVT::i8 || ElemTy == MVT::i16)
73 setOperationAction(ISD::EXTRACT_VECTOR_ELT, VT, Custom);
74 setOperationAction(ISD::BUILD_VECTOR, VT, Custom);
75 setOperationAction(ISD::VECTOR_SHUFFLE, VT, Custom);
76 setOperationAction(ISD::SCALAR_TO_VECTOR, VT, Custom);
77 setOperationAction(ISD::CONCAT_VECTORS, VT, Custom);
78 if (VT.isInteger()) {
79 setOperationAction(ISD::SHL, VT, Custom);
80 setOperationAction(ISD::SRA, VT, Custom);
81 setOperationAction(ISD::SRL, VT, Custom);
82 }
83
84 // Promote all bit-wise operations.
85 if (VT.isInteger() && VT != PromotedBitwiseVT) {
86 setOperationAction(ISD::AND, VT, Promote);
87 AddPromotedToType (ISD::AND, VT, PromotedBitwiseVT);
88 setOperationAction(ISD::OR, VT, Promote);
89 AddPromotedToType (ISD::OR, VT, PromotedBitwiseVT);
90 setOperationAction(ISD::XOR, VT, Promote);
91 AddPromotedToType (ISD::XOR, VT, PromotedBitwiseVT);
92 }
93}
94
95void ARMTargetLowering::addDRTypeForNEON(MVT VT) {
96 addRegisterClass(VT, ARM::DPRRegisterClass);
97 addTypeForNEON(VT, MVT::f64, MVT::v2i32);
98}
99
100void ARMTargetLowering::addQRTypeForNEON(MVT VT) {
101 addRegisterClass(VT, ARM::QPRRegisterClass);
102 addTypeForNEON(VT, MVT::v2f64, MVT::v4i32);
103}
104
Evan Chenga8e29892007-01-19 07:51:42 +0000105ARMTargetLowering::ARMTargetLowering(TargetMachine &TM)
106 : TargetLowering(TM), ARMPCLabelIndex(0) {
107 Subtarget = &TM.getSubtarget<ARMSubtarget>();
108
Evan Chengb1df8f22007-04-27 08:15:43 +0000109 if (Subtarget->isTargetDarwin()) {
Evan Chengb1df8f22007-04-27 08:15:43 +0000110 // Uses VFP for Thumb libfuncs if available.
111 if (Subtarget->isThumb() && Subtarget->hasVFP2()) {
112 // Single-precision floating-point arithmetic.
113 setLibcallName(RTLIB::ADD_F32, "__addsf3vfp");
114 setLibcallName(RTLIB::SUB_F32, "__subsf3vfp");
115 setLibcallName(RTLIB::MUL_F32, "__mulsf3vfp");
116 setLibcallName(RTLIB::DIV_F32, "__divsf3vfp");
Evan Chenga8e29892007-01-19 07:51:42 +0000117
Evan Chengb1df8f22007-04-27 08:15:43 +0000118 // Double-precision floating-point arithmetic.
119 setLibcallName(RTLIB::ADD_F64, "__adddf3vfp");
120 setLibcallName(RTLIB::SUB_F64, "__subdf3vfp");
121 setLibcallName(RTLIB::MUL_F64, "__muldf3vfp");
122 setLibcallName(RTLIB::DIV_F64, "__divdf3vfp");
Evan Cheng193f8502007-01-31 09:30:58 +0000123
Evan Chengb1df8f22007-04-27 08:15:43 +0000124 // Single-precision comparisons.
125 setLibcallName(RTLIB::OEQ_F32, "__eqsf2vfp");
126 setLibcallName(RTLIB::UNE_F32, "__nesf2vfp");
127 setLibcallName(RTLIB::OLT_F32, "__ltsf2vfp");
128 setLibcallName(RTLIB::OLE_F32, "__lesf2vfp");
129 setLibcallName(RTLIB::OGE_F32, "__gesf2vfp");
130 setLibcallName(RTLIB::OGT_F32, "__gtsf2vfp");
131 setLibcallName(RTLIB::UO_F32, "__unordsf2vfp");
132 setLibcallName(RTLIB::O_F32, "__unordsf2vfp");
Evan Chenga8e29892007-01-19 07:51:42 +0000133
Evan Chengb1df8f22007-04-27 08:15:43 +0000134 setCmpLibcallCC(RTLIB::OEQ_F32, ISD::SETNE);
135 setCmpLibcallCC(RTLIB::UNE_F32, ISD::SETNE);
136 setCmpLibcallCC(RTLIB::OLT_F32, ISD::SETNE);
137 setCmpLibcallCC(RTLIB::OLE_F32, ISD::SETNE);
138 setCmpLibcallCC(RTLIB::OGE_F32, ISD::SETNE);
139 setCmpLibcallCC(RTLIB::OGT_F32, ISD::SETNE);
140 setCmpLibcallCC(RTLIB::UO_F32, ISD::SETNE);
141 setCmpLibcallCC(RTLIB::O_F32, ISD::SETEQ);
Evan Cheng193f8502007-01-31 09:30:58 +0000142
Evan Chengb1df8f22007-04-27 08:15:43 +0000143 // Double-precision comparisons.
144 setLibcallName(RTLIB::OEQ_F64, "__eqdf2vfp");
145 setLibcallName(RTLIB::UNE_F64, "__nedf2vfp");
146 setLibcallName(RTLIB::OLT_F64, "__ltdf2vfp");
147 setLibcallName(RTLIB::OLE_F64, "__ledf2vfp");
148 setLibcallName(RTLIB::OGE_F64, "__gedf2vfp");
149 setLibcallName(RTLIB::OGT_F64, "__gtdf2vfp");
150 setLibcallName(RTLIB::UO_F64, "__unorddf2vfp");
151 setLibcallName(RTLIB::O_F64, "__unorddf2vfp");
Evan Chenga8e29892007-01-19 07:51:42 +0000152
Evan Chengb1df8f22007-04-27 08:15:43 +0000153 setCmpLibcallCC(RTLIB::OEQ_F64, ISD::SETNE);
154 setCmpLibcallCC(RTLIB::UNE_F64, ISD::SETNE);
155 setCmpLibcallCC(RTLIB::OLT_F64, ISD::SETNE);
156 setCmpLibcallCC(RTLIB::OLE_F64, ISD::SETNE);
157 setCmpLibcallCC(RTLIB::OGE_F64, ISD::SETNE);
158 setCmpLibcallCC(RTLIB::OGT_F64, ISD::SETNE);
159 setCmpLibcallCC(RTLIB::UO_F64, ISD::SETNE);
160 setCmpLibcallCC(RTLIB::O_F64, ISD::SETEQ);
Evan Chenga8e29892007-01-19 07:51:42 +0000161
Evan Chengb1df8f22007-04-27 08:15:43 +0000162 // Floating-point to integer conversions.
163 // i64 conversions are done via library routines even when generating VFP
164 // instructions, so use the same ones.
165 setLibcallName(RTLIB::FPTOSINT_F64_I32, "__fixdfsivfp");
166 setLibcallName(RTLIB::FPTOUINT_F64_I32, "__fixunsdfsivfp");
167 setLibcallName(RTLIB::FPTOSINT_F32_I32, "__fixsfsivfp");
168 setLibcallName(RTLIB::FPTOUINT_F32_I32, "__fixunssfsivfp");
Evan Chenga8e29892007-01-19 07:51:42 +0000169
Evan Chengb1df8f22007-04-27 08:15:43 +0000170 // Conversions between floating types.
171 setLibcallName(RTLIB::FPROUND_F64_F32, "__truncdfsf2vfp");
172 setLibcallName(RTLIB::FPEXT_F32_F64, "__extendsfdf2vfp");
173
174 // Integer to floating-point conversions.
175 // i64 conversions are done via library routines even when generating VFP
176 // instructions, so use the same ones.
Bob Wilson2a14c522009-03-20 23:16:43 +0000177 // FIXME: There appears to be some naming inconsistency in ARM libgcc:
178 // e.g., __floatunsidf vs. __floatunssidfvfp.
Evan Chengb1df8f22007-04-27 08:15:43 +0000179 setLibcallName(RTLIB::SINTTOFP_I32_F64, "__floatsidfvfp");
180 setLibcallName(RTLIB::UINTTOFP_I32_F64, "__floatunssidfvfp");
181 setLibcallName(RTLIB::SINTTOFP_I32_F32, "__floatsisfvfp");
182 setLibcallName(RTLIB::UINTTOFP_I32_F32, "__floatunssisfvfp");
183 }
Evan Chenga8e29892007-01-19 07:51:42 +0000184 }
185
Bob Wilson2f954612009-05-22 17:38:41 +0000186 // These libcalls are not available in 32-bit.
187 setLibcallName(RTLIB::SHL_I128, 0);
188 setLibcallName(RTLIB::SRL_I128, 0);
189 setLibcallName(RTLIB::SRA_I128, 0);
190
Jim Grosbach30eae3c2009-04-07 20:34:09 +0000191 if (Subtarget->isThumb())
192 addRegisterClass(MVT::i32, ARM::tGPRRegisterClass);
193 else
194 addRegisterClass(MVT::i32, ARM::GPRRegisterClass);
Evan Chengb6ab2542007-01-31 08:40:13 +0000195 if (!UseSoftFloat && Subtarget->hasVFP2() && !Subtarget->isThumb()) {
Evan Chenga8e29892007-01-19 07:51:42 +0000196 addRegisterClass(MVT::f32, ARM::SPRRegisterClass);
197 addRegisterClass(MVT::f64, ARM::DPRRegisterClass);
Bob Wilson2dc4f542009-03-20 22:42:55 +0000198
Chris Lattnerddf89562008-01-17 19:59:44 +0000199 setTruncStoreAction(MVT::f64, MVT::f32, Expand);
Evan Chenga8e29892007-01-19 07:51:42 +0000200 }
Bob Wilson5bafff32009-06-22 23:27:02 +0000201
202 if (Subtarget->hasNEON()) {
203 addDRTypeForNEON(MVT::v2f32);
204 addDRTypeForNEON(MVT::v8i8);
205 addDRTypeForNEON(MVT::v4i16);
206 addDRTypeForNEON(MVT::v2i32);
207 addDRTypeForNEON(MVT::v1i64);
208
209 addQRTypeForNEON(MVT::v4f32);
210 addQRTypeForNEON(MVT::v2f64);
211 addQRTypeForNEON(MVT::v16i8);
212 addQRTypeForNEON(MVT::v8i16);
213 addQRTypeForNEON(MVT::v4i32);
214 addQRTypeForNEON(MVT::v2i64);
215
216 setTargetDAGCombine(ISD::INTRINSIC_WO_CHAIN);
217 setTargetDAGCombine(ISD::SHL);
218 setTargetDAGCombine(ISD::SRL);
219 setTargetDAGCombine(ISD::SRA);
220 setTargetDAGCombine(ISD::SIGN_EXTEND);
221 setTargetDAGCombine(ISD::ZERO_EXTEND);
222 setTargetDAGCombine(ISD::ANY_EXTEND);
223 }
224
Evan Cheng9f8cbd12007-05-18 00:19:34 +0000225 computeRegisterProperties();
Evan Chenga8e29892007-01-19 07:51:42 +0000226
227 // ARM does not have f32 extending load.
Evan Cheng03294662008-10-14 21:26:46 +0000228 setLoadExtAction(ISD::EXTLOAD, MVT::f32, Expand);
Evan Chenga8e29892007-01-19 07:51:42 +0000229
Duncan Sandsf9c98e62008-01-23 20:39:46 +0000230 // ARM does not have i1 sign extending load.
Evan Cheng03294662008-10-14 21:26:46 +0000231 setLoadExtAction(ISD::SEXTLOAD, MVT::i1, Promote);
Duncan Sandsf9c98e62008-01-23 20:39:46 +0000232
Evan Chenga8e29892007-01-19 07:51:42 +0000233 // ARM supports all 4 flavors of integer indexed load / store.
Evan Chenge88d5ce2009-07-02 07:28:31 +0000234 if (!Subtarget->isThumb1Only()) {
235 for (unsigned im = (unsigned)ISD::PRE_INC;
236 im != (unsigned)ISD::LAST_INDEXED_MODE; ++im) {
237 setIndexedLoadAction(im, MVT::i1, Legal);
238 setIndexedLoadAction(im, MVT::i8, Legal);
239 setIndexedLoadAction(im, MVT::i16, Legal);
240 setIndexedLoadAction(im, MVT::i32, Legal);
241 setIndexedStoreAction(im, MVT::i1, Legal);
242 setIndexedStoreAction(im, MVT::i8, Legal);
243 setIndexedStoreAction(im, MVT::i16, Legal);
244 setIndexedStoreAction(im, MVT::i32, Legal);
245 }
Evan Chenga8e29892007-01-19 07:51:42 +0000246 }
247
248 // i64 operation support.
249 if (Subtarget->isThumb()) {
250 setOperationAction(ISD::MUL, MVT::i64, Expand);
251 setOperationAction(ISD::MULHU, MVT::i32, Expand);
252 setOperationAction(ISD::MULHS, MVT::i32, Expand);
Dan Gohman525178c2007-10-08 18:33:35 +0000253 setOperationAction(ISD::UMUL_LOHI, MVT::i32, Expand);
254 setOperationAction(ISD::SMUL_LOHI, MVT::i32, Expand);
Evan Chenga8e29892007-01-19 07:51:42 +0000255 } else {
Dan Gohman525178c2007-10-08 18:33:35 +0000256 setOperationAction(ISD::MUL, MVT::i64, Expand);
257 setOperationAction(ISD::MULHU, MVT::i32, Expand);
Evan Chenga8e29892007-01-19 07:51:42 +0000258 if (!Subtarget->hasV6Ops())
Dan Gohman525178c2007-10-08 18:33:35 +0000259 setOperationAction(ISD::MULHS, MVT::i32, Expand);
Evan Chenga8e29892007-01-19 07:51:42 +0000260 }
261 setOperationAction(ISD::SHL_PARTS, MVT::i32, Expand);
262 setOperationAction(ISD::SRA_PARTS, MVT::i32, Expand);
263 setOperationAction(ISD::SRL_PARTS, MVT::i32, Expand);
264 setOperationAction(ISD::SRL, MVT::i64, Custom);
265 setOperationAction(ISD::SRA, MVT::i64, Custom);
266
267 // ARM does not have ROTL.
268 setOperationAction(ISD::ROTL, MVT::i32, Expand);
Bob Wilson2dc4f542009-03-20 22:42:55 +0000269 setOperationAction(ISD::CTTZ, MVT::i32, Expand);
Evan Chenga8e29892007-01-19 07:51:42 +0000270 setOperationAction(ISD::CTPOP, MVT::i32, Expand);
David Goodwin24062ac2009-06-26 20:47:43 +0000271 if (!Subtarget->hasV5TOps() || Subtarget->isThumb1Only())
Evan Chenga8e29892007-01-19 07:51:42 +0000272 setOperationAction(ISD::CTLZ, MVT::i32, Expand);
273
Lauro Ramos Venancio368f20f2007-03-16 22:54:16 +0000274 // Only ARMv6 has BSWAP.
275 if (!Subtarget->hasV6Ops())
Chris Lattner1719e132007-03-20 02:25:53 +0000276 setOperationAction(ISD::BSWAP, MVT::i32, Expand);
Lauro Ramos Venancio368f20f2007-03-16 22:54:16 +0000277
Evan Chenga8e29892007-01-19 07:51:42 +0000278 // These are expanded into libcalls.
279 setOperationAction(ISD::SDIV, MVT::i32, Expand);
280 setOperationAction(ISD::UDIV, MVT::i32, Expand);
281 setOperationAction(ISD::SREM, MVT::i32, Expand);
282 setOperationAction(ISD::UREM, MVT::i32, Expand);
Dan Gohman525178c2007-10-08 18:33:35 +0000283 setOperationAction(ISD::SDIVREM, MVT::i32, Expand);
284 setOperationAction(ISD::UDIVREM, MVT::i32, Expand);
Bob Wilson2dc4f542009-03-20 22:42:55 +0000285
Evan Chenga8e29892007-01-19 07:51:42 +0000286 // Support label based line numbers.
Dan Gohman7f460202008-06-30 20:59:49 +0000287 setOperationAction(ISD::DBG_STOPPOINT, MVT::Other, Expand);
Evan Chenga8e29892007-01-19 07:51:42 +0000288 setOperationAction(ISD::DEBUG_LOC, MVT::Other, Expand);
Evan Chenga8e29892007-01-19 07:51:42 +0000289
290 setOperationAction(ISD::RET, MVT::Other, Custom);
291 setOperationAction(ISD::GlobalAddress, MVT::i32, Custom);
292 setOperationAction(ISD::ConstantPool, MVT::i32, Custom);
Lauro Ramos Venancio0ae4a332007-04-22 00:04:12 +0000293 setOperationAction(ISD::GLOBAL_OFFSET_TABLE, MVT::i32, Custom);
Lauro Ramos Venancio64f4fa52007-04-27 13:54:47 +0000294 setOperationAction(ISD::GlobalTLSAddress, MVT::i32, Custom);
Evan Chenga8e29892007-01-19 07:51:42 +0000295
Evan Chenga8e29892007-01-19 07:51:42 +0000296 // Use the default implementation.
Bob Wilson2dc4f542009-03-20 22:42:55 +0000297 setOperationAction(ISD::VASTART, MVT::Other, Custom);
298 setOperationAction(ISD::VAARG, MVT::Other, Expand);
299 setOperationAction(ISD::VACOPY, MVT::Other, Expand);
300 setOperationAction(ISD::VAEND, MVT::Other, Expand);
301 setOperationAction(ISD::STACKSAVE, MVT::Other, Expand);
Evan Chenga8e29892007-01-19 07:51:42 +0000302 setOperationAction(ISD::STACKRESTORE, MVT::Other, Expand);
Bob Wilson2dc4f542009-03-20 22:42:55 +0000303 setOperationAction(ISD::DYNAMIC_STACKALLOC, MVT::i32, Expand);
304 setOperationAction(ISD::MEMBARRIER, MVT::Other, Expand);
Evan Chenga8e29892007-01-19 07:51:42 +0000305
Evan Chengd27c9fc2009-07-03 01:43:10 +0000306 if (!Subtarget->hasV6Ops() && !Subtarget->isThumb2()) {
Evan Chenga8e29892007-01-19 07:51:42 +0000307 setOperationAction(ISD::SIGN_EXTEND_INREG, MVT::i16, Expand);
308 setOperationAction(ISD::SIGN_EXTEND_INREG, MVT::i8, Expand);
309 }
310 setOperationAction(ISD::SIGN_EXTEND_INREG, MVT::i1, Expand);
311
Evan Chengb6ab2542007-01-31 08:40:13 +0000312 if (!UseSoftFloat && Subtarget->hasVFP2() && !Subtarget->isThumb())
Evan Chengc7c77292008-11-04 19:57:48 +0000313 // Turn f64->i64 into FMRRD, i64 -> f64 to FMDRR iff target supports vfp2.
Evan Chenga8e29892007-01-19 07:51:42 +0000314 setOperationAction(ISD::BIT_CONVERT, MVT::i64, Custom);
Lauro Ramos Venancioe0cb36b2007-11-08 17:20:05 +0000315
316 // We want to custom lower some of our intrinsics.
317 setOperationAction(ISD::INTRINSIC_WO_CHAIN, MVT::Other, Custom);
318
Bob Wilson2dc4f542009-03-20 22:42:55 +0000319 setOperationAction(ISD::SETCC, MVT::i32, Expand);
320 setOperationAction(ISD::SETCC, MVT::f32, Expand);
321 setOperationAction(ISD::SETCC, MVT::f64, Expand);
322 setOperationAction(ISD::SELECT, MVT::i32, Expand);
323 setOperationAction(ISD::SELECT, MVT::f32, Expand);
324 setOperationAction(ISD::SELECT, MVT::f64, Expand);
Evan Chenga8e29892007-01-19 07:51:42 +0000325 setOperationAction(ISD::SELECT_CC, MVT::i32, Custom);
326 setOperationAction(ISD::SELECT_CC, MVT::f32, Custom);
327 setOperationAction(ISD::SELECT_CC, MVT::f64, Custom);
328
Bob Wilson2dc4f542009-03-20 22:42:55 +0000329 setOperationAction(ISD::BRCOND, MVT::Other, Expand);
330 setOperationAction(ISD::BR_CC, MVT::i32, Custom);
331 setOperationAction(ISD::BR_CC, MVT::f32, Custom);
332 setOperationAction(ISD::BR_CC, MVT::f64, Custom);
333 setOperationAction(ISD::BR_JT, MVT::Other, Custom);
Evan Chenga8e29892007-01-19 07:51:42 +0000334
Dan Gohmanf96e4de2007-10-11 23:21:31 +0000335 // We don't support sin/cos/fmod/copysign/pow
Bob Wilson2dc4f542009-03-20 22:42:55 +0000336 setOperationAction(ISD::FSIN, MVT::f64, Expand);
337 setOperationAction(ISD::FSIN, MVT::f32, Expand);
338 setOperationAction(ISD::FCOS, MVT::f32, Expand);
339 setOperationAction(ISD::FCOS, MVT::f64, Expand);
340 setOperationAction(ISD::FREM, MVT::f64, Expand);
341 setOperationAction(ISD::FREM, MVT::f32, Expand);
Evan Cheng110cf482008-04-01 01:50:16 +0000342 if (!UseSoftFloat && Subtarget->hasVFP2() && !Subtarget->isThumb()) {
343 setOperationAction(ISD::FCOPYSIGN, MVT::f64, Custom);
344 setOperationAction(ISD::FCOPYSIGN, MVT::f32, Custom);
345 }
Bob Wilson2dc4f542009-03-20 22:42:55 +0000346 setOperationAction(ISD::FPOW, MVT::f64, Expand);
347 setOperationAction(ISD::FPOW, MVT::f32, Expand);
348
Evan Chenga8e29892007-01-19 07:51:42 +0000349 // int <-> fp are custom expanded into bit_convert + ARMISD ops.
Evan Cheng110cf482008-04-01 01:50:16 +0000350 if (!UseSoftFloat && Subtarget->hasVFP2() && !Subtarget->isThumb()) {
351 setOperationAction(ISD::SINT_TO_FP, MVT::i32, Custom);
352 setOperationAction(ISD::UINT_TO_FP, MVT::i32, Custom);
353 setOperationAction(ISD::FP_TO_UINT, MVT::i32, Custom);
354 setOperationAction(ISD::FP_TO_SINT, MVT::i32, Custom);
355 }
Evan Chenga8e29892007-01-19 07:51:42 +0000356
Chris Lattnerf1b1c5e2007-11-27 22:36:16 +0000357 // We have target-specific dag combine patterns for the following nodes:
358 // ARMISD::FMRRD - No need to call setTargetDAGCombine
Chris Lattnerd1980a52009-03-12 06:52:53 +0000359 setTargetDAGCombine(ISD::ADD);
360 setTargetDAGCombine(ISD::SUB);
Bob Wilson2dc4f542009-03-20 22:42:55 +0000361
Evan Chenga8e29892007-01-19 07:51:42 +0000362 setStackPointerRegisterToSaveRestore(ARM::SP);
Evan Chenga8e29892007-01-19 07:51:42 +0000363 setSchedulingPreference(SchedulingForRegPressure);
Evan Cheng9f8cbd12007-05-18 00:19:34 +0000364 setIfCvtBlockSizeLimit(Subtarget->isThumb() ? 0 : 10);
Evan Cheng97e604e2007-06-19 23:55:02 +0000365 setIfCvtDupBlockSizeLimit(Subtarget->isThumb() ? 0 : 2);
Dale Johannesen8dd86c12007-05-17 21:31:21 +0000366
Evan Cheng8557c2b2009-06-19 01:51:50 +0000367 if (!Subtarget->isThumb()) {
368 // Use branch latency information to determine if-conversion limits.
Evan Chengb1019482009-06-19 07:06:07 +0000369 // FIXME: If-converter should use instruction latency of the branch being
370 // eliminated to compute the threshold. For ARMv6, the branch "latency"
371 // varies depending on whether it's dynamically or statically predicted
372 // and on whether the destination is in the prefetch buffer.
Evan Cheng8557c2b2009-06-19 01:51:50 +0000373 const TargetInstrInfo *TII = getTargetMachine().getInstrInfo();
374 const InstrItineraryData &InstrItins = Subtarget->getInstrItineraryData();
Evan Cheng7a42b082009-06-19 06:56:26 +0000375 unsigned Latency= InstrItins.getLatency(TII->get(ARM::Bcc).getSchedClass());
Evan Cheng8557c2b2009-06-19 01:51:50 +0000376 if (Latency > 1) {
377 setIfCvtBlockSizeLimit(Latency-1);
378 if (Latency > 2)
379 setIfCvtDupBlockSizeLimit(Latency-2);
380 } else {
381 setIfCvtBlockSizeLimit(10);
382 setIfCvtDupBlockSizeLimit(2);
383 }
384 }
385
Dale Johannesen8dd86c12007-05-17 21:31:21 +0000386 maxStoresPerMemcpy = 1; //// temporary - rewrite interface to use type
Bob Wilsone6abdff2009-05-18 20:55:32 +0000387 // Do not enable CodePlacementOpt for now: it currently runs after the
388 // ARMConstantIslandPass and messes up branch relaxation and placement
389 // of constant islands.
390 // benefitFromCodePlacementOpt = true;
Evan Chenga8e29892007-01-19 07:51:42 +0000391}
392
Evan Chenga8e29892007-01-19 07:51:42 +0000393const char *ARMTargetLowering::getTargetNodeName(unsigned Opcode) const {
394 switch (Opcode) {
395 default: return 0;
396 case ARMISD::Wrapper: return "ARMISD::Wrapper";
Evan Chenga8e29892007-01-19 07:51:42 +0000397 case ARMISD::WrapperJT: return "ARMISD::WrapperJT";
398 case ARMISD::CALL: return "ARMISD::CALL";
Evan Cheng277f0742007-06-19 21:05:09 +0000399 case ARMISD::CALL_PRED: return "ARMISD::CALL_PRED";
Evan Chenga8e29892007-01-19 07:51:42 +0000400 case ARMISD::CALL_NOLINK: return "ARMISD::CALL_NOLINK";
401 case ARMISD::tCALL: return "ARMISD::tCALL";
402 case ARMISD::BRCOND: return "ARMISD::BRCOND";
403 case ARMISD::BR_JT: return "ARMISD::BR_JT";
404 case ARMISD::RET_FLAG: return "ARMISD::RET_FLAG";
405 case ARMISD::PIC_ADD: return "ARMISD::PIC_ADD";
406 case ARMISD::CMP: return "ARMISD::CMP";
David Goodwinc0309b42009-06-29 15:33:01 +0000407 case ARMISD::CMPZ: return "ARMISD::CMPZ";
Evan Chenga8e29892007-01-19 07:51:42 +0000408 case ARMISD::CMPFP: return "ARMISD::CMPFP";
409 case ARMISD::CMPFPw0: return "ARMISD::CMPFPw0";
410 case ARMISD::FMSTAT: return "ARMISD::FMSTAT";
411 case ARMISD::CMOV: return "ARMISD::CMOV";
412 case ARMISD::CNEG: return "ARMISD::CNEG";
Bob Wilson2dc4f542009-03-20 22:42:55 +0000413
Evan Chenga8e29892007-01-19 07:51:42 +0000414 case ARMISD::FTOSI: return "ARMISD::FTOSI";
415 case ARMISD::FTOUI: return "ARMISD::FTOUI";
416 case ARMISD::SITOF: return "ARMISD::SITOF";
417 case ARMISD::UITOF: return "ARMISD::UITOF";
Evan Chenga8e29892007-01-19 07:51:42 +0000418
419 case ARMISD::SRL_FLAG: return "ARMISD::SRL_FLAG";
420 case ARMISD::SRA_FLAG: return "ARMISD::SRA_FLAG";
421 case ARMISD::RRX: return "ARMISD::RRX";
Bob Wilson2dc4f542009-03-20 22:42:55 +0000422
Evan Chenga8e29892007-01-19 07:51:42 +0000423 case ARMISD::FMRRD: return "ARMISD::FMRRD";
424 case ARMISD::FMDRR: return "ARMISD::FMDRR";
Lauro Ramos Venancio64f4fa52007-04-27 13:54:47 +0000425
426 case ARMISD::THREAD_POINTER:return "ARMISD::THREAD_POINTER";
Bob Wilson5bafff32009-06-22 23:27:02 +0000427
428 case ARMISD::VCEQ: return "ARMISD::VCEQ";
429 case ARMISD::VCGE: return "ARMISD::VCGE";
430 case ARMISD::VCGEU: return "ARMISD::VCGEU";
431 case ARMISD::VCGT: return "ARMISD::VCGT";
432 case ARMISD::VCGTU: return "ARMISD::VCGTU";
433 case ARMISD::VTST: return "ARMISD::VTST";
434
435 case ARMISD::VSHL: return "ARMISD::VSHL";
436 case ARMISD::VSHRs: return "ARMISD::VSHRs";
437 case ARMISD::VSHRu: return "ARMISD::VSHRu";
438 case ARMISD::VSHLLs: return "ARMISD::VSHLLs";
439 case ARMISD::VSHLLu: return "ARMISD::VSHLLu";
440 case ARMISD::VSHLLi: return "ARMISD::VSHLLi";
441 case ARMISD::VSHRN: return "ARMISD::VSHRN";
442 case ARMISD::VRSHRs: return "ARMISD::VRSHRs";
443 case ARMISD::VRSHRu: return "ARMISD::VRSHRu";
444 case ARMISD::VRSHRN: return "ARMISD::VRSHRN";
445 case ARMISD::VQSHLs: return "ARMISD::VQSHLs";
446 case ARMISD::VQSHLu: return "ARMISD::VQSHLu";
447 case ARMISD::VQSHLsu: return "ARMISD::VQSHLsu";
448 case ARMISD::VQSHRNs: return "ARMISD::VQSHRNs";
449 case ARMISD::VQSHRNu: return "ARMISD::VQSHRNu";
450 case ARMISD::VQSHRNsu: return "ARMISD::VQSHRNsu";
451 case ARMISD::VQRSHRNs: return "ARMISD::VQRSHRNs";
452 case ARMISD::VQRSHRNu: return "ARMISD::VQRSHRNu";
453 case ARMISD::VQRSHRNsu: return "ARMISD::VQRSHRNsu";
454 case ARMISD::VGETLANEu: return "ARMISD::VGETLANEu";
455 case ARMISD::VGETLANEs: return "ARMISD::VGETLANEs";
456 case ARMISD::VDUPLANEQ: return "ARMISD::VDUPLANEQ";
Evan Chenga8e29892007-01-19 07:51:42 +0000457 }
458}
459
Bill Wendlingb4202b82009-07-01 18:50:55 +0000460/// getFunctionAlignment - Return the Log2 alignment of this function.
Bill Wendling20c568f2009-06-30 22:38:32 +0000461unsigned ARMTargetLowering::getFunctionAlignment(const Function *F) const {
462 return getTargetMachine().getSubtarget<ARMSubtarget>().isThumb() ? 1 : 2;
463}
464
Evan Chenga8e29892007-01-19 07:51:42 +0000465//===----------------------------------------------------------------------===//
466// Lowering Code
467//===----------------------------------------------------------------------===//
468
Evan Chenga8e29892007-01-19 07:51:42 +0000469/// IntCCToARMCC - Convert a DAG integer condition code to an ARM CC
470static ARMCC::CondCodes IntCCToARMCC(ISD::CondCode CC) {
471 switch (CC) {
472 default: assert(0 && "Unknown condition code!");
473 case ISD::SETNE: return ARMCC::NE;
474 case ISD::SETEQ: return ARMCC::EQ;
475 case ISD::SETGT: return ARMCC::GT;
476 case ISD::SETGE: return ARMCC::GE;
477 case ISD::SETLT: return ARMCC::LT;
478 case ISD::SETLE: return ARMCC::LE;
479 case ISD::SETUGT: return ARMCC::HI;
480 case ISD::SETUGE: return ARMCC::HS;
481 case ISD::SETULT: return ARMCC::LO;
482 case ISD::SETULE: return ARMCC::LS;
483 }
484}
485
486/// FPCCToARMCC - Convert a DAG fp condition code to an ARM CC. It
487/// returns true if the operands should be inverted to form the proper
488/// comparison.
489static bool FPCCToARMCC(ISD::CondCode CC, ARMCC::CondCodes &CondCode,
490 ARMCC::CondCodes &CondCode2) {
491 bool Invert = false;
492 CondCode2 = ARMCC::AL;
493 switch (CC) {
494 default: assert(0 && "Unknown FP condition!");
495 case ISD::SETEQ:
496 case ISD::SETOEQ: CondCode = ARMCC::EQ; break;
497 case ISD::SETGT:
498 case ISD::SETOGT: CondCode = ARMCC::GT; break;
499 case ISD::SETGE:
500 case ISD::SETOGE: CondCode = ARMCC::GE; break;
501 case ISD::SETOLT: CondCode = ARMCC::MI; break;
502 case ISD::SETOLE: CondCode = ARMCC::GT; Invert = true; break;
503 case ISD::SETONE: CondCode = ARMCC::MI; CondCode2 = ARMCC::GT; break;
504 case ISD::SETO: CondCode = ARMCC::VC; break;
505 case ISD::SETUO: CondCode = ARMCC::VS; break;
506 case ISD::SETUEQ: CondCode = ARMCC::EQ; CondCode2 = ARMCC::VS; break;
507 case ISD::SETUGT: CondCode = ARMCC::HI; break;
508 case ISD::SETUGE: CondCode = ARMCC::PL; break;
509 case ISD::SETLT:
510 case ISD::SETULT: CondCode = ARMCC::LT; break;
511 case ISD::SETLE:
512 case ISD::SETULE: CondCode = ARMCC::LE; break;
513 case ISD::SETNE:
514 case ISD::SETUNE: CondCode = ARMCC::NE; break;
515 }
516 return Invert;
517}
518
Bob Wilson1f595bb2009-04-17 19:07:39 +0000519//===----------------------------------------------------------------------===//
520// Calling Convention Implementation
521//
522// The lower operations present on calling convention works on this order:
523// LowerCALL (virt regs --> phys regs, virt regs --> stack)
524// LowerFORMAL_ARGUMENTS (phys --> virt regs, stack --> virt regs)
525// LowerRET (virt regs --> phys regs)
526// LowerCALL (phys regs --> virt regs)
527//
528//===----------------------------------------------------------------------===//
529
530#include "ARMGenCallingConv.inc"
531
532// APCS f64 is in register pairs, possibly split to stack
Bob Wilson5bafff32009-06-22 23:27:02 +0000533static bool f64AssignAPCS(unsigned &ValNo, MVT &ValVT, MVT &LocVT,
534 CCValAssign::LocInfo &LocInfo,
535 CCState &State, bool CanFail) {
536 static const unsigned RegList[] = { ARM::R0, ARM::R1, ARM::R2, ARM::R3 };
537
538 // Try to get the first register.
539 if (unsigned Reg = State.AllocateReg(RegList, 4))
540 State.addLoc(CCValAssign::getCustomReg(ValNo, ValVT, Reg, LocVT, LocInfo));
541 else {
542 // For the 2nd half of a v2f64, do not fail.
543 if (CanFail)
544 return false;
545
546 // Put the whole thing on the stack.
547 State.addLoc(CCValAssign::getCustomMem(ValNo, ValVT,
548 State.AllocateStack(8, 4),
549 LocVT, LocInfo));
550 return true;
551 }
552
553 // Try to get the second register.
554 if (unsigned Reg = State.AllocateReg(RegList, 4))
555 State.addLoc(CCValAssign::getCustomReg(ValNo, ValVT, Reg, LocVT, LocInfo));
556 else
557 State.addLoc(CCValAssign::getCustomMem(ValNo, ValVT,
558 State.AllocateStack(4, 4),
559 LocVT, LocInfo));
560 return true;
561}
562
Bob Wilsondee46d72009-04-17 20:35:10 +0000563static bool CC_ARM_APCS_Custom_f64(unsigned &ValNo, MVT &ValVT, MVT &LocVT,
Bob Wilson1f595bb2009-04-17 19:07:39 +0000564 CCValAssign::LocInfo &LocInfo,
565 ISD::ArgFlagsTy &ArgFlags,
566 CCState &State) {
Bob Wilson5bafff32009-06-22 23:27:02 +0000567 if (!f64AssignAPCS(ValNo, ValVT, LocVT, LocInfo, State, true))
568 return false;
569 if (LocVT == MVT::v2f64 &&
570 !f64AssignAPCS(ValNo, ValVT, LocVT, LocInfo, State, false))
571 return false;
Bob Wilsone65586b2009-04-17 20:40:45 +0000572 return true; // we handled it
Bob Wilson1f595bb2009-04-17 19:07:39 +0000573}
574
575// AAPCS f64 is in aligned register pairs
Bob Wilson5bafff32009-06-22 23:27:02 +0000576static bool f64AssignAAPCS(unsigned &ValNo, MVT &ValVT, MVT &LocVT,
577 CCValAssign::LocInfo &LocInfo,
578 CCState &State, bool CanFail) {
579 static const unsigned HiRegList[] = { ARM::R0, ARM::R2 };
580 static const unsigned LoRegList[] = { ARM::R1, ARM::R3 };
581
582 unsigned Reg = State.AllocateReg(HiRegList, LoRegList, 2);
583 if (Reg == 0) {
584 // For the 2nd half of a v2f64, do not just fail.
585 if (CanFail)
586 return false;
587
588 // Put the whole thing on the stack.
589 State.addLoc(CCValAssign::getCustomMem(ValNo, ValVT,
590 State.AllocateStack(8, 8),
591 LocVT, LocInfo));
592 return true;
593 }
594
595 unsigned i;
596 for (i = 0; i < 2; ++i)
597 if (HiRegList[i] == Reg)
598 break;
599
600 State.addLoc(CCValAssign::getCustomReg(ValNo, ValVT, Reg, LocVT, LocInfo));
601 State.addLoc(CCValAssign::getCustomReg(ValNo, ValVT, LoRegList[i],
602 LocVT, LocInfo));
603 return true;
604}
605
Bob Wilsondee46d72009-04-17 20:35:10 +0000606static bool CC_ARM_AAPCS_Custom_f64(unsigned &ValNo, MVT &ValVT, MVT &LocVT,
Bob Wilson1f595bb2009-04-17 19:07:39 +0000607 CCValAssign::LocInfo &LocInfo,
608 ISD::ArgFlagsTy &ArgFlags,
609 CCState &State) {
Bob Wilson5bafff32009-06-22 23:27:02 +0000610 if (!f64AssignAAPCS(ValNo, ValVT, LocVT, LocInfo, State, true))
611 return false;
612 if (LocVT == MVT::v2f64 &&
613 !f64AssignAAPCS(ValNo, ValVT, LocVT, LocInfo, State, false))
614 return false;
615 return true; // we handled it
616}
617
618static bool f64RetAssign(unsigned &ValNo, MVT &ValVT, MVT &LocVT,
619 CCValAssign::LocInfo &LocInfo, CCState &State) {
Bob Wilson1f595bb2009-04-17 19:07:39 +0000620 static const unsigned HiRegList[] = { ARM::R0, ARM::R2 };
621 static const unsigned LoRegList[] = { ARM::R1, ARM::R3 };
622
Bob Wilsone65586b2009-04-17 20:40:45 +0000623 unsigned Reg = State.AllocateReg(HiRegList, LoRegList, 2);
624 if (Reg == 0)
625 return false; // we didn't handle it
Bob Wilson1f595bb2009-04-17 19:07:39 +0000626
Bob Wilsone65586b2009-04-17 20:40:45 +0000627 unsigned i;
628 for (i = 0; i < 2; ++i)
629 if (HiRegList[i] == Reg)
630 break;
Bob Wilson1f595bb2009-04-17 19:07:39 +0000631
Bob Wilson5bafff32009-06-22 23:27:02 +0000632 State.addLoc(CCValAssign::getCustomReg(ValNo, ValVT, Reg, LocVT, LocInfo));
Bob Wilsone65586b2009-04-17 20:40:45 +0000633 State.addLoc(CCValAssign::getCustomReg(ValNo, ValVT, LoRegList[i],
Bob Wilson5bafff32009-06-22 23:27:02 +0000634 LocVT, LocInfo));
635 return true;
Bob Wilson1f595bb2009-04-17 19:07:39 +0000636}
637
Bob Wilsondee46d72009-04-17 20:35:10 +0000638static bool RetCC_ARM_APCS_Custom_f64(unsigned &ValNo, MVT &ValVT, MVT &LocVT,
Bob Wilson1f595bb2009-04-17 19:07:39 +0000639 CCValAssign::LocInfo &LocInfo,
640 ISD::ArgFlagsTy &ArgFlags,
641 CCState &State) {
Bob Wilson5bafff32009-06-22 23:27:02 +0000642 if (!f64RetAssign(ValNo, ValVT, LocVT, LocInfo, State))
643 return false;
644 if (LocVT == MVT::v2f64 && !f64RetAssign(ValNo, ValVT, LocVT, LocInfo, State))
645 return false;
Bob Wilsone65586b2009-04-17 20:40:45 +0000646 return true; // we handled it
Bob Wilson1f595bb2009-04-17 19:07:39 +0000647}
648
Bob Wilsondee46d72009-04-17 20:35:10 +0000649static bool RetCC_ARM_AAPCS_Custom_f64(unsigned &ValNo, MVT &ValVT, MVT &LocVT,
Bob Wilson1f595bb2009-04-17 19:07:39 +0000650 CCValAssign::LocInfo &LocInfo,
651 ISD::ArgFlagsTy &ArgFlags,
652 CCState &State) {
653 return RetCC_ARM_APCS_Custom_f64(ValNo, ValVT, LocVT, LocInfo, ArgFlags,
654 State);
655}
656
Anton Korobeynikov385f5a92009-06-16 18:50:49 +0000657/// CCAssignFnForNode - Selects the correct CCAssignFn for a the
658/// given CallingConvention value.
659CCAssignFn *ARMTargetLowering::CCAssignFnForNode(unsigned CC,
660 bool Return) const {
661 switch (CC) {
662 default:
663 assert(0 && "Unsupported calling convention");
664 case CallingConv::C:
665 case CallingConv::Fast:
666 // Use target triple & subtarget features to do actual dispatch.
667 if (Subtarget->isAAPCS_ABI()) {
668 if (Subtarget->hasVFP2() &&
669 FloatABIType == FloatABI::Hard)
670 return (Return ? RetCC_ARM_AAPCS_VFP: CC_ARM_AAPCS_VFP);
671 else
672 return (Return ? RetCC_ARM_AAPCS: CC_ARM_AAPCS);
673 } else
674 return (Return ? RetCC_ARM_APCS: CC_ARM_APCS);
675 case CallingConv::ARM_AAPCS_VFP:
676 return (Return ? RetCC_ARM_AAPCS_VFP: CC_ARM_AAPCS_VFP);
677 case CallingConv::ARM_AAPCS:
678 return (Return ? RetCC_ARM_AAPCS: CC_ARM_AAPCS);
679 case CallingConv::ARM_APCS:
680 return (Return ? RetCC_ARM_APCS: CC_ARM_APCS);
681 }
682}
683
Bob Wilson1f595bb2009-04-17 19:07:39 +0000684/// LowerCallResult - Lower the result values of an ISD::CALL into the
685/// appropriate copies out of appropriate physical registers. This assumes that
686/// Chain/InFlag are the input chain/flag to use, and that TheCall is the call
687/// being lowered. The returns a SDNode with the same number of values as the
688/// ISD::CALL.
689SDNode *ARMTargetLowering::
690LowerCallResult(SDValue Chain, SDValue InFlag, CallSDNode *TheCall,
691 unsigned CallingConv, SelectionDAG &DAG) {
692
693 DebugLoc dl = TheCall->getDebugLoc();
694 // Assign locations to each value returned by this call.
695 SmallVector<CCValAssign, 16> RVLocs;
696 bool isVarArg = TheCall->isVarArg();
697 CCState CCInfo(CallingConv, isVarArg, getTargetMachine(), RVLocs);
Anton Korobeynikov385f5a92009-06-16 18:50:49 +0000698 CCInfo.AnalyzeCallResult(TheCall,
699 CCAssignFnForNode(CallingConv, /* Return*/ true));
Bob Wilson1f595bb2009-04-17 19:07:39 +0000700
701 SmallVector<SDValue, 8> ResultVals;
702
703 // Copy all of the result registers out of their specified physreg.
704 for (unsigned i = 0; i != RVLocs.size(); ++i) {
705 CCValAssign VA = RVLocs[i];
706
Bob Wilson80915242009-04-25 00:33:20 +0000707 SDValue Val;
Bob Wilson1f595bb2009-04-17 19:07:39 +0000708 if (VA.needsCustom()) {
Bob Wilson5bafff32009-06-22 23:27:02 +0000709 // Handle f64 or half of a v2f64.
Bob Wilson80915242009-04-25 00:33:20 +0000710 SDValue Lo = DAG.getCopyFromReg(Chain, dl, VA.getLocReg(), MVT::i32,
Bob Wilson1f595bb2009-04-17 19:07:39 +0000711 InFlag);
Bob Wilson4d59e1d2009-04-24 17:00:36 +0000712 Chain = Lo.getValue(1);
713 InFlag = Lo.getValue(2);
Bob Wilson1f595bb2009-04-17 19:07:39 +0000714 VA = RVLocs[++i]; // skip ahead to next loc
Bob Wilson80915242009-04-25 00:33:20 +0000715 SDValue Hi = DAG.getCopyFromReg(Chain, dl, VA.getLocReg(), MVT::i32,
Bob Wilson4d59e1d2009-04-24 17:00:36 +0000716 InFlag);
717 Chain = Hi.getValue(1);
718 InFlag = Hi.getValue(2);
Bob Wilson80915242009-04-25 00:33:20 +0000719 Val = DAG.getNode(ARMISD::FMDRR, dl, MVT::f64, Lo, Hi);
Bob Wilson5bafff32009-06-22 23:27:02 +0000720
721 if (VA.getLocVT() == MVT::v2f64) {
722 SDValue Vec = DAG.getNode(ISD::UNDEF, dl, MVT::v2f64);
723 Vec = DAG.getNode(ISD::INSERT_VECTOR_ELT, dl, MVT::v2f64, Vec, Val,
724 DAG.getConstant(0, MVT::i32));
725
726 VA = RVLocs[++i]; // skip ahead to next loc
727 Lo = DAG.getCopyFromReg(Chain, dl, VA.getLocReg(), MVT::i32, InFlag);
728 Chain = Lo.getValue(1);
729 InFlag = Lo.getValue(2);
730 VA = RVLocs[++i]; // skip ahead to next loc
731 Hi = DAG.getCopyFromReg(Chain, dl, VA.getLocReg(), MVT::i32, InFlag);
732 Chain = Hi.getValue(1);
733 InFlag = Hi.getValue(2);
734 Val = DAG.getNode(ARMISD::FMDRR, dl, MVT::f64, Lo, Hi);
735 Val = DAG.getNode(ISD::INSERT_VECTOR_ELT, dl, MVT::v2f64, Vec, Val,
736 DAG.getConstant(1, MVT::i32));
737 }
Bob Wilson1f595bb2009-04-17 19:07:39 +0000738 } else {
Bob Wilson80915242009-04-25 00:33:20 +0000739 Val = DAG.getCopyFromReg(Chain, dl, VA.getLocReg(), VA.getLocVT(),
740 InFlag);
Bob Wilson4d59e1d2009-04-24 17:00:36 +0000741 Chain = Val.getValue(1);
742 InFlag = Val.getValue(2);
Bob Wilson1f595bb2009-04-17 19:07:39 +0000743 }
Bob Wilson80915242009-04-25 00:33:20 +0000744
745 switch (VA.getLocInfo()) {
746 default: assert(0 && "Unknown loc info!");
747 case CCValAssign::Full: break;
748 case CCValAssign::BCvt:
749 Val = DAG.getNode(ISD::BIT_CONVERT, dl, VA.getValVT(), Val);
750 break;
751 }
752
753 ResultVals.push_back(Val);
Bob Wilson1f595bb2009-04-17 19:07:39 +0000754 }
755
756 // Merge everything together with a MERGE_VALUES node.
757 ResultVals.push_back(Chain);
758 return DAG.getNode(ISD::MERGE_VALUES, dl, TheCall->getVTList(),
759 &ResultVals[0], ResultVals.size()).getNode();
760}
761
762/// CreateCopyOfByValArgument - Make a copy of an aggregate at address specified
763/// by "Src" to address "Dst" of size "Size". Alignment information is
Bob Wilsondee46d72009-04-17 20:35:10 +0000764/// specified by the specific parameter attribute. The copy will be passed as
Bob Wilson1f595bb2009-04-17 19:07:39 +0000765/// a byval function parameter.
766/// Sometimes what we are copying is the end of a larger object, the part that
767/// does not fit in registers.
768static SDValue
769CreateCopyOfByValArgument(SDValue Src, SDValue Dst, SDValue Chain,
770 ISD::ArgFlagsTy Flags, SelectionDAG &DAG,
771 DebugLoc dl) {
772 SDValue SizeNode = DAG.getConstant(Flags.getByValSize(), MVT::i32);
773 return DAG.getMemcpy(Chain, dl, Dst, Src, SizeNode, Flags.getByValAlign(),
774 /*AlwaysInline=*/false, NULL, 0, NULL, 0);
775}
776
Bob Wilsondee46d72009-04-17 20:35:10 +0000777/// LowerMemOpCallTo - Store the argument to the stack.
Bob Wilson1f595bb2009-04-17 19:07:39 +0000778SDValue
779ARMTargetLowering::LowerMemOpCallTo(CallSDNode *TheCall, SelectionDAG &DAG,
780 const SDValue &StackPtr,
Bob Wilsondee46d72009-04-17 20:35:10 +0000781 const CCValAssign &VA, SDValue Chain,
Bob Wilson1f595bb2009-04-17 19:07:39 +0000782 SDValue Arg, ISD::ArgFlagsTy Flags) {
783 DebugLoc dl = TheCall->getDebugLoc();
784 unsigned LocMemOffset = VA.getLocMemOffset();
785 SDValue PtrOff = DAG.getIntPtrConstant(LocMemOffset);
786 PtrOff = DAG.getNode(ISD::ADD, dl, getPointerTy(), StackPtr, PtrOff);
787 if (Flags.isByVal()) {
788 return CreateCopyOfByValArgument(Arg, PtrOff, Chain, Flags, DAG, dl);
789 }
790 return DAG.getStore(Chain, dl, Arg, PtrOff,
791 PseudoSourceValue::getStack(), LocMemOffset);
Evan Chenga8e29892007-01-19 07:51:42 +0000792}
793
Bob Wilson5bafff32009-06-22 23:27:02 +0000794void ARMTargetLowering::PassF64ArgInRegs(CallSDNode *TheCall, SelectionDAG &DAG,
795 SDValue Chain, SDValue &Arg,
796 RegsToPassVector &RegsToPass,
797 CCValAssign &VA, CCValAssign &NextVA,
798 SDValue &StackPtr,
799 SmallVector<SDValue, 8> &MemOpChains,
800 ISD::ArgFlagsTy Flags) {
801 DebugLoc dl = TheCall->getDebugLoc();
802
803 SDValue fmrrd = DAG.getNode(ARMISD::FMRRD, dl,
804 DAG.getVTList(MVT::i32, MVT::i32), Arg);
805 RegsToPass.push_back(std::make_pair(VA.getLocReg(), fmrrd));
806
807 if (NextVA.isRegLoc())
808 RegsToPass.push_back(std::make_pair(NextVA.getLocReg(), fmrrd.getValue(1)));
809 else {
810 assert(NextVA.isMemLoc());
811 if (StackPtr.getNode() == 0)
812 StackPtr = DAG.getCopyFromReg(Chain, dl, ARM::SP, getPointerTy());
813
814 MemOpChains.push_back(LowerMemOpCallTo(TheCall, DAG, StackPtr, NextVA,
815 Chain, fmrrd.getValue(1), Flags));
816 }
817}
818
Evan Chengfc403422007-02-03 08:53:01 +0000819/// LowerCALL - Lowering a ISD::CALL node into a callseq_start <-
820/// ARMISD:CALL <- callseq_end chain. Also add input and output parameter
821/// nodes.
Dan Gohman475871a2008-07-27 21:46:04 +0000822SDValue ARMTargetLowering::LowerCALL(SDValue Op, SelectionDAG &DAG) {
Dan Gohman095cc292008-09-13 01:54:27 +0000823 CallSDNode *TheCall = cast<CallSDNode>(Op.getNode());
Bob Wilson1f595bb2009-04-17 19:07:39 +0000824 MVT RetVT = TheCall->getRetValType(0);
825 SDValue Chain = TheCall->getChain();
826 unsigned CC = TheCall->getCallingConv();
Bob Wilson1f595bb2009-04-17 19:07:39 +0000827 bool isVarArg = TheCall->isVarArg();
828 SDValue Callee = TheCall->getCallee();
829 DebugLoc dl = TheCall->getDebugLoc();
Evan Chenga8e29892007-01-19 07:51:42 +0000830
Bob Wilson1f595bb2009-04-17 19:07:39 +0000831 // Analyze operands of the call, assigning locations to each operand.
832 SmallVector<CCValAssign, 16> ArgLocs;
833 CCState CCInfo(CC, isVarArg, getTargetMachine(), ArgLocs);
Anton Korobeynikov385f5a92009-06-16 18:50:49 +0000834 CCInfo.AnalyzeCallOperands(TheCall, CCAssignFnForNode(CC, /* Return*/ false));
Evan Chenga8e29892007-01-19 07:51:42 +0000835
Bob Wilson1f595bb2009-04-17 19:07:39 +0000836 // Get a count of how many bytes are to be pushed on the stack.
837 unsigned NumBytes = CCInfo.getNextStackOffset();
Evan Chenga8e29892007-01-19 07:51:42 +0000838
839 // Adjust the stack pointer for the new arguments...
840 // These operations are automatically eliminated by the prolog/epilog pass
Chris Lattnere563bbc2008-10-11 22:08:30 +0000841 Chain = DAG.getCALLSEQ_START(Chain, DAG.getIntPtrConstant(NumBytes, true));
Evan Chenga8e29892007-01-19 07:51:42 +0000842
Dan Gohman475871a2008-07-27 21:46:04 +0000843 SDValue StackPtr = DAG.getRegister(ARM::SP, MVT::i32);
Evan Chenga8e29892007-01-19 07:51:42 +0000844
Bob Wilson5bafff32009-06-22 23:27:02 +0000845 RegsToPassVector RegsToPass;
Bob Wilson1f595bb2009-04-17 19:07:39 +0000846 SmallVector<SDValue, 8> MemOpChains;
Evan Chenga8e29892007-01-19 07:51:42 +0000847
Bob Wilson1f595bb2009-04-17 19:07:39 +0000848 // Walk the register/memloc assignments, inserting copies/loads. In the case
Bob Wilsondee46d72009-04-17 20:35:10 +0000849 // of tail call optimization, arguments are handled later.
Bob Wilson1f595bb2009-04-17 19:07:39 +0000850 for (unsigned i = 0, realArgIdx = 0, e = ArgLocs.size();
851 i != e;
852 ++i, ++realArgIdx) {
853 CCValAssign &VA = ArgLocs[i];
854 SDValue Arg = TheCall->getArg(realArgIdx);
855 ISD::ArgFlagsTy Flags = TheCall->getArgFlags(realArgIdx);
Evan Chenga8e29892007-01-19 07:51:42 +0000856
Bob Wilson1f595bb2009-04-17 19:07:39 +0000857 // Promote the value if needed.
858 switch (VA.getLocInfo()) {
859 default: assert(0 && "Unknown loc info!");
860 case CCValAssign::Full: break;
861 case CCValAssign::SExt:
862 Arg = DAG.getNode(ISD::SIGN_EXTEND, dl, VA.getLocVT(), Arg);
863 break;
864 case CCValAssign::ZExt:
865 Arg = DAG.getNode(ISD::ZERO_EXTEND, dl, VA.getLocVT(), Arg);
866 break;
867 case CCValAssign::AExt:
868 Arg = DAG.getNode(ISD::ANY_EXTEND, dl, VA.getLocVT(), Arg);
869 break;
870 case CCValAssign::BCvt:
871 Arg = DAG.getNode(ISD::BIT_CONVERT, dl, VA.getLocVT(), Arg);
872 break;
Evan Chenga8e29892007-01-19 07:51:42 +0000873 }
874
Bob Wilson5bafff32009-06-22 23:27:02 +0000875 // f64 and v2f64 are passed in i32 pairs and must be split into pieces
Bob Wilson1f595bb2009-04-17 19:07:39 +0000876 if (VA.needsCustom()) {
Bob Wilson5bafff32009-06-22 23:27:02 +0000877 if (VA.getLocVT() == MVT::v2f64) {
878 SDValue Op0 = DAG.getNode(ISD::EXTRACT_VECTOR_ELT, dl, MVT::f64, Arg,
879 DAG.getConstant(0, MVT::i32));
880 SDValue Op1 = DAG.getNode(ISD::EXTRACT_VECTOR_ELT, dl, MVT::f64, Arg,
881 DAG.getConstant(1, MVT::i32));
Bob Wilson1f595bb2009-04-17 19:07:39 +0000882
Bob Wilson5bafff32009-06-22 23:27:02 +0000883 PassF64ArgInRegs(TheCall, DAG, Chain, Op0, RegsToPass,
884 VA, ArgLocs[++i], StackPtr, MemOpChains, Flags);
885
886 VA = ArgLocs[++i]; // skip ahead to next loc
887 if (VA.isRegLoc()) {
888 PassF64ArgInRegs(TheCall, DAG, Chain, Op1, RegsToPass,
889 VA, ArgLocs[++i], StackPtr, MemOpChains, Flags);
890 } else {
891 assert(VA.isMemLoc());
892 if (StackPtr.getNode() == 0)
893 StackPtr = DAG.getCopyFromReg(Chain, dl, ARM::SP, getPointerTy());
894
895 MemOpChains.push_back(LowerMemOpCallTo(TheCall, DAG, StackPtr, VA,
896 Chain, Op1, Flags));
897 }
898 } else {
899 PassF64ArgInRegs(TheCall, DAG, Chain, Arg, RegsToPass, VA, ArgLocs[++i],
900 StackPtr, MemOpChains, Flags);
Bob Wilson1f595bb2009-04-17 19:07:39 +0000901 }
902 } else if (VA.isRegLoc()) {
903 RegsToPass.push_back(std::make_pair(VA.getLocReg(), Arg));
904 } else {
905 assert(VA.isMemLoc());
906 if (StackPtr.getNode() == 0)
907 StackPtr = DAG.getCopyFromReg(Chain, dl, ARM::SP, getPointerTy());
908
909 MemOpChains.push_back(LowerMemOpCallTo(TheCall, DAG, StackPtr, VA,
910 Chain, Arg, Flags));
911 }
Evan Chenga8e29892007-01-19 07:51:42 +0000912 }
913
914 if (!MemOpChains.empty())
Dale Johannesen33c960f2009-02-04 20:06:27 +0000915 Chain = DAG.getNode(ISD::TokenFactor, dl, MVT::Other,
Evan Chenga8e29892007-01-19 07:51:42 +0000916 &MemOpChains[0], MemOpChains.size());
917
918 // Build a sequence of copy-to-reg nodes chained together with token chain
919 // and flag operands which copy the outgoing args into the appropriate regs.
Dan Gohman475871a2008-07-27 21:46:04 +0000920 SDValue InFlag;
Evan Chenga8e29892007-01-19 07:51:42 +0000921 for (unsigned i = 0, e = RegsToPass.size(); i != e; ++i) {
Bob Wilson2dc4f542009-03-20 22:42:55 +0000922 Chain = DAG.getCopyToReg(Chain, dl, RegsToPass[i].first,
Dale Johannesen33c960f2009-02-04 20:06:27 +0000923 RegsToPass[i].second, InFlag);
Evan Chenga8e29892007-01-19 07:51:42 +0000924 InFlag = Chain.getValue(1);
925 }
926
Bill Wendling056292f2008-09-16 21:48:12 +0000927 // If the callee is a GlobalAddress/ExternalSymbol node (quite common, every
928 // direct call is) turn it into a TargetGlobalAddress/TargetExternalSymbol
929 // node so that legalize doesn't hack it.
Evan Chenga8e29892007-01-19 07:51:42 +0000930 bool isDirect = false;
931 bool isARMFunc = false;
Evan Cheng277f0742007-06-19 21:05:09 +0000932 bool isLocalARMFunc = false;
Evan Chenga8e29892007-01-19 07:51:42 +0000933 if (GlobalAddressSDNode *G = dyn_cast<GlobalAddressSDNode>(Callee)) {
934 GlobalValue *GV = G->getGlobal();
Evan Chenga8e29892007-01-19 07:51:42 +0000935 isDirect = true;
Reid Spencer5cbf9852007-01-30 20:08:39 +0000936 bool isExt = (GV->isDeclaration() || GV->hasWeakLinkage() ||
Evan Chenga8e29892007-01-19 07:51:42 +0000937 GV->hasLinkOnceLinkage());
Evan Cheng970a4192007-01-19 19:28:01 +0000938 bool isStub = (isExt && Subtarget->isTargetDarwin()) &&
Evan Chenga8e29892007-01-19 07:51:42 +0000939 getTargetMachine().getRelocationModel() != Reloc::Static;
940 isARMFunc = !Subtarget->isThumb() || isStub;
Evan Cheng277f0742007-06-19 21:05:09 +0000941 // ARM call to a local ARM function is predicable.
942 isLocalARMFunc = !Subtarget->isThumb() && !isExt;
Evan Chengc60e76d2007-01-30 20:37:08 +0000943 // tBX takes a register source operand.
944 if (isARMFunc && Subtarget->isThumb() && !Subtarget->hasV5TOps()) {
945 ARMConstantPoolValue *CPV = new ARMConstantPoolValue(GV, ARMPCLabelIndex,
946 ARMCP::CPStub, 4);
Evan Cheng1606e8e2009-03-13 07:51:59 +0000947 SDValue CPAddr = DAG.getTargetConstantPool(CPV, getPointerTy(), 4);
Dale Johannesenb300d2a2009-02-07 00:55:49 +0000948 CPAddr = DAG.getNode(ARMISD::Wrapper, dl, MVT::i32, CPAddr);
Bob Wilson2dc4f542009-03-20 22:42:55 +0000949 Callee = DAG.getLoad(getPointerTy(), dl,
950 DAG.getEntryNode(), CPAddr, NULL, 0);
Dan Gohman475871a2008-07-27 21:46:04 +0000951 SDValue PICLabel = DAG.getConstant(ARMPCLabelIndex++, MVT::i32);
Bob Wilson2dc4f542009-03-20 22:42:55 +0000952 Callee = DAG.getNode(ARMISD::PIC_ADD, dl,
Dale Johannesen33c960f2009-02-04 20:06:27 +0000953 getPointerTy(), Callee, PICLabel);
Evan Chengc60e76d2007-01-30 20:37:08 +0000954 } else
955 Callee = DAG.getTargetGlobalAddress(GV, getPointerTy());
Bill Wendling056292f2008-09-16 21:48:12 +0000956 } else if (ExternalSymbolSDNode *S = dyn_cast<ExternalSymbolSDNode>(Callee)) {
Evan Chenga8e29892007-01-19 07:51:42 +0000957 isDirect = true;
Evan Cheng970a4192007-01-19 19:28:01 +0000958 bool isStub = Subtarget->isTargetDarwin() &&
Evan Chenga8e29892007-01-19 07:51:42 +0000959 getTargetMachine().getRelocationModel() != Reloc::Static;
960 isARMFunc = !Subtarget->isThumb() || isStub;
Evan Chengc60e76d2007-01-30 20:37:08 +0000961 // tBX takes a register source operand.
962 const char *Sym = S->getSymbol();
963 if (isARMFunc && Subtarget->isThumb() && !Subtarget->hasV5TOps()) {
964 ARMConstantPoolValue *CPV = new ARMConstantPoolValue(Sym, ARMPCLabelIndex,
965 ARMCP::CPStub, 4);
Evan Cheng1606e8e2009-03-13 07:51:59 +0000966 SDValue CPAddr = DAG.getTargetConstantPool(CPV, getPointerTy(), 4);
Dale Johannesenb300d2a2009-02-07 00:55:49 +0000967 CPAddr = DAG.getNode(ARMISD::Wrapper, dl, MVT::i32, CPAddr);
Dale Johannesen33c960f2009-02-04 20:06:27 +0000968 Callee = DAG.getLoad(getPointerTy(), dl,
Bob Wilson2dc4f542009-03-20 22:42:55 +0000969 DAG.getEntryNode(), CPAddr, NULL, 0);
Dan Gohman475871a2008-07-27 21:46:04 +0000970 SDValue PICLabel = DAG.getConstant(ARMPCLabelIndex++, MVT::i32);
Bob Wilson2dc4f542009-03-20 22:42:55 +0000971 Callee = DAG.getNode(ARMISD::PIC_ADD, dl,
Dale Johannesen33c960f2009-02-04 20:06:27 +0000972 getPointerTy(), Callee, PICLabel);
Evan Chengc60e76d2007-01-30 20:37:08 +0000973 } else
Bill Wendling056292f2008-09-16 21:48:12 +0000974 Callee = DAG.getTargetExternalSymbol(Sym, getPointerTy());
Evan Chenga8e29892007-01-19 07:51:42 +0000975 }
976
Lauro Ramos Venancio64c88d72007-03-20 17:57:23 +0000977 // FIXME: handle tail calls differently.
978 unsigned CallOpc;
979 if (Subtarget->isThumb()) {
980 if (!Subtarget->hasV5TOps() && (!isDirect || isARMFunc))
981 CallOpc = ARMISD::CALL_NOLINK;
982 else
983 CallOpc = isARMFunc ? ARMISD::CALL : ARMISD::tCALL;
984 } else {
985 CallOpc = (isDirect || Subtarget->hasV5TOps())
Evan Cheng277f0742007-06-19 21:05:09 +0000986 ? (isLocalARMFunc ? ARMISD::CALL_PRED : ARMISD::CALL)
987 : ARMISD::CALL_NOLINK;
Lauro Ramos Venancio64c88d72007-03-20 17:57:23 +0000988 }
Lauro Ramos Venanciob8a93a42007-03-27 16:19:21 +0000989 if (CallOpc == ARMISD::CALL_NOLINK && !Subtarget->isThumb()) {
990 // implicit def LR - LR mustn't be allocated as GRP:$dst of CALL_NOLINK
Dale Johannesene8d72302009-02-06 23:05:02 +0000991 Chain = DAG.getCopyToReg(Chain, dl, ARM::LR, DAG.getUNDEF(MVT::i32),InFlag);
Lauro Ramos Venancio64c88d72007-03-20 17:57:23 +0000992 InFlag = Chain.getValue(1);
993 }
994
Dan Gohman475871a2008-07-27 21:46:04 +0000995 std::vector<SDValue> Ops;
Evan Chenga8e29892007-01-19 07:51:42 +0000996 Ops.push_back(Chain);
997 Ops.push_back(Callee);
998
999 // Add argument registers to the end of the list so that they are known live
1000 // into the call.
1001 for (unsigned i = 0, e = RegsToPass.size(); i != e; ++i)
1002 Ops.push_back(DAG.getRegister(RegsToPass[i].first,
1003 RegsToPass[i].second.getValueType()));
1004
Gabor Greifba36cb52008-08-28 21:40:38 +00001005 if (InFlag.getNode())
Evan Chenga8e29892007-01-19 07:51:42 +00001006 Ops.push_back(InFlag);
Duncan Sands4bdcb612008-07-02 17:40:58 +00001007 // Returns a chain and a flag for retval copy to use.
Dale Johannesen33c960f2009-02-04 20:06:27 +00001008 Chain = DAG.getNode(CallOpc, dl, DAG.getVTList(MVT::Other, MVT::Flag),
Duncan Sands4bdcb612008-07-02 17:40:58 +00001009 &Ops[0], Ops.size());
Evan Chenga8e29892007-01-19 07:51:42 +00001010 InFlag = Chain.getValue(1);
1011
Chris Lattnere563bbc2008-10-11 22:08:30 +00001012 Chain = DAG.getCALLSEQ_END(Chain, DAG.getIntPtrConstant(NumBytes, true),
1013 DAG.getIntPtrConstant(0, true), InFlag);
Evan Chenga8e29892007-01-19 07:51:42 +00001014 if (RetVT != MVT::Other)
1015 InFlag = Chain.getValue(1);
1016
Bob Wilson1f595bb2009-04-17 19:07:39 +00001017 // Handle result values, copying them out of physregs into vregs that we
1018 // return.
1019 return SDValue(LowerCallResult(Chain, InFlag, TheCall, CC, DAG),
1020 Op.getResNo());
Evan Chenga8e29892007-01-19 07:51:42 +00001021}
1022
Bob Wilson1f595bb2009-04-17 19:07:39 +00001023SDValue ARMTargetLowering::LowerRET(SDValue Op, SelectionDAG &DAG) {
1024 // The chain is always operand #0
Dan Gohman475871a2008-07-27 21:46:04 +00001025 SDValue Chain = Op.getOperand(0);
Dale Johannesena05dca42009-02-04 23:02:30 +00001026 DebugLoc dl = Op.getDebugLoc();
Bob Wilson2dc4f542009-03-20 22:42:55 +00001027
Bob Wilsondee46d72009-04-17 20:35:10 +00001028 // CCValAssign - represent the assignment of the return value to a location.
Bob Wilson1f595bb2009-04-17 19:07:39 +00001029 SmallVector<CCValAssign, 16> RVLocs;
1030 unsigned CC = DAG.getMachineFunction().getFunction()->getCallingConv();
1031 bool isVarArg = DAG.getMachineFunction().getFunction()->isVarArg();
1032
Bob Wilsondee46d72009-04-17 20:35:10 +00001033 // CCState - Info about the registers and stack slots.
Bob Wilson1f595bb2009-04-17 19:07:39 +00001034 CCState CCInfo(CC, isVarArg, getTargetMachine(), RVLocs);
1035
Bob Wilsondee46d72009-04-17 20:35:10 +00001036 // Analyze return values of ISD::RET.
Anton Korobeynikov385f5a92009-06-16 18:50:49 +00001037 CCInfo.AnalyzeReturn(Op.getNode(), CCAssignFnForNode(CC, /* Return */ true));
Bob Wilson1f595bb2009-04-17 19:07:39 +00001038
1039 // If this is the first return lowered for this function, add
1040 // the regs to the liveout set for the function.
1041 if (DAG.getMachineFunction().getRegInfo().liveout_empty()) {
1042 for (unsigned i = 0; i != RVLocs.size(); ++i)
1043 if (RVLocs[i].isRegLoc())
1044 DAG.getMachineFunction().getRegInfo().addLiveOut(RVLocs[i].getLocReg());
Evan Chenga8e29892007-01-19 07:51:42 +00001045 }
1046
Bob Wilson1f595bb2009-04-17 19:07:39 +00001047 SDValue Flag;
1048
1049 // Copy the result values into the output registers.
1050 for (unsigned i = 0, realRVLocIdx = 0;
1051 i != RVLocs.size();
1052 ++i, ++realRVLocIdx) {
1053 CCValAssign &VA = RVLocs[i];
1054 assert(VA.isRegLoc() && "Can only return in registers!");
1055
1056 // ISD::RET => ret chain, (regnum1,val1), ...
1057 // So i*2+1 index only the regnums
1058 SDValue Arg = Op.getOperand(realRVLocIdx*2+1);
1059
1060 switch (VA.getLocInfo()) {
1061 default: assert(0 && "Unknown loc info!");
1062 case CCValAssign::Full: break;
1063 case CCValAssign::BCvt:
1064 Arg = DAG.getNode(ISD::BIT_CONVERT, dl, VA.getLocVT(), Arg);
1065 break;
1066 }
1067
Bob Wilson1f595bb2009-04-17 19:07:39 +00001068 if (VA.needsCustom()) {
Bob Wilson5bafff32009-06-22 23:27:02 +00001069 if (VA.getLocVT() == MVT::v2f64) {
1070 // Extract the first half and return it in two registers.
1071 SDValue Half = DAG.getNode(ISD::EXTRACT_VECTOR_ELT, dl, MVT::f64, Arg,
1072 DAG.getConstant(0, MVT::i32));
1073 SDValue HalfGPRs = DAG.getNode(ARMISD::FMRRD, dl,
1074 DAG.getVTList(MVT::i32, MVT::i32), Half);
1075
1076 Chain = DAG.getCopyToReg(Chain, dl, VA.getLocReg(), HalfGPRs, Flag);
1077 Flag = Chain.getValue(1);
1078 VA = RVLocs[++i]; // skip ahead to next loc
1079 Chain = DAG.getCopyToReg(Chain, dl, VA.getLocReg(),
1080 HalfGPRs.getValue(1), Flag);
1081 Flag = Chain.getValue(1);
1082 VA = RVLocs[++i]; // skip ahead to next loc
1083
1084 // Extract the 2nd half and fall through to handle it as an f64 value.
1085 Arg = DAG.getNode(ISD::EXTRACT_VECTOR_ELT, dl, MVT::f64, Arg,
1086 DAG.getConstant(1, MVT::i32));
1087 }
1088 // Legalize ret f64 -> ret 2 x i32. We always have fmrrd if f64 is
1089 // available.
Bob Wilson1f595bb2009-04-17 19:07:39 +00001090 SDValue fmrrd = DAG.getNode(ARMISD::FMRRD, dl,
1091 DAG.getVTList(MVT::i32, MVT::i32), &Arg, 1);
1092 Chain = DAG.getCopyToReg(Chain, dl, VA.getLocReg(), fmrrd, Flag);
Bob Wilson4d59e1d2009-04-24 17:00:36 +00001093 Flag = Chain.getValue(1);
Bob Wilson1f595bb2009-04-17 19:07:39 +00001094 VA = RVLocs[++i]; // skip ahead to next loc
1095 Chain = DAG.getCopyToReg(Chain, dl, VA.getLocReg(), fmrrd.getValue(1),
1096 Flag);
1097 } else
1098 Chain = DAG.getCopyToReg(Chain, dl, VA.getLocReg(), Arg, Flag);
1099
Bob Wilsondee46d72009-04-17 20:35:10 +00001100 // Guarantee that all emitted copies are
1101 // stuck together, avoiding something bad.
Bob Wilson1f595bb2009-04-17 19:07:39 +00001102 Flag = Chain.getValue(1);
1103 }
1104
1105 SDValue result;
1106 if (Flag.getNode())
1107 result = DAG.getNode(ARMISD::RET_FLAG, dl, MVT::Other, Chain, Flag);
1108 else // Return Void
1109 result = DAG.getNode(ARMISD::RET_FLAG, dl, MVT::Other, Chain);
1110
1111 return result;
Evan Chenga8e29892007-01-19 07:51:42 +00001112}
1113
Bob Wilson2dc4f542009-03-20 22:42:55 +00001114// ConstantPool, JumpTable, GlobalAddress, and ExternalSymbol are lowered as
Bill Wendling056292f2008-09-16 21:48:12 +00001115// their target countpart wrapped in the ARMISD::Wrapper node. Suppose N is
1116// one of the above mentioned nodes. It has to be wrapped because otherwise
1117// Select(N) returns N. So the raw TargetGlobalAddress nodes, etc. can only
1118// be used to form addressing mode. These wrapped nodes will be selected
1119// into MOVi.
Dan Gohman475871a2008-07-27 21:46:04 +00001120static SDValue LowerConstantPool(SDValue Op, SelectionDAG &DAG) {
Duncan Sands83ec4b62008-06-06 12:08:01 +00001121 MVT PtrVT = Op.getValueType();
Dale Johannesenb300d2a2009-02-07 00:55:49 +00001122 // FIXME there is no actual debug info here
1123 DebugLoc dl = Op.getDebugLoc();
Evan Chenga8e29892007-01-19 07:51:42 +00001124 ConstantPoolSDNode *CP = cast<ConstantPoolSDNode>(Op);
Dan Gohman475871a2008-07-27 21:46:04 +00001125 SDValue Res;
Evan Chenga8e29892007-01-19 07:51:42 +00001126 if (CP->isMachineConstantPoolEntry())
1127 Res = DAG.getTargetConstantPool(CP->getMachineCPVal(), PtrVT,
1128 CP->getAlignment());
1129 else
1130 Res = DAG.getTargetConstantPool(CP->getConstVal(), PtrVT,
1131 CP->getAlignment());
Dale Johannesenb300d2a2009-02-07 00:55:49 +00001132 return DAG.getNode(ARMISD::Wrapper, dl, MVT::i32, Res);
Evan Chenga8e29892007-01-19 07:51:42 +00001133}
1134
Lauro Ramos Venancio64f4fa52007-04-27 13:54:47 +00001135// Lower ISD::GlobalTLSAddress using the "general dynamic" model
Dan Gohman475871a2008-07-27 21:46:04 +00001136SDValue
Lauro Ramos Venancio64f4fa52007-04-27 13:54:47 +00001137ARMTargetLowering::LowerToTLSGeneralDynamicModel(GlobalAddressSDNode *GA,
1138 SelectionDAG &DAG) {
Dale Johannesen33c960f2009-02-04 20:06:27 +00001139 DebugLoc dl = GA->getDebugLoc();
Duncan Sands83ec4b62008-06-06 12:08:01 +00001140 MVT PtrVT = getPointerTy();
Lauro Ramos Venancio64f4fa52007-04-27 13:54:47 +00001141 unsigned char PCAdj = Subtarget->isThumb() ? 4 : 8;
1142 ARMConstantPoolValue *CPV =
1143 new ARMConstantPoolValue(GA->getGlobal(), ARMPCLabelIndex, ARMCP::CPValue,
1144 PCAdj, "tlsgd", true);
Evan Cheng1606e8e2009-03-13 07:51:59 +00001145 SDValue Argument = DAG.getTargetConstantPool(CPV, PtrVT, 4);
Dale Johannesenb300d2a2009-02-07 00:55:49 +00001146 Argument = DAG.getNode(ARMISD::Wrapper, dl, MVT::i32, Argument);
Dale Johannesen33c960f2009-02-04 20:06:27 +00001147 Argument = DAG.getLoad(PtrVT, dl, DAG.getEntryNode(), Argument, NULL, 0);
Dan Gohman475871a2008-07-27 21:46:04 +00001148 SDValue Chain = Argument.getValue(1);
Lauro Ramos Venancio64f4fa52007-04-27 13:54:47 +00001149
Dan Gohman475871a2008-07-27 21:46:04 +00001150 SDValue PICLabel = DAG.getConstant(ARMPCLabelIndex++, MVT::i32);
Dale Johannesen33c960f2009-02-04 20:06:27 +00001151 Argument = DAG.getNode(ARMISD::PIC_ADD, dl, PtrVT, Argument, PICLabel);
Lauro Ramos Venancio64f4fa52007-04-27 13:54:47 +00001152
1153 // call __tls_get_addr.
1154 ArgListTy Args;
1155 ArgListEntry Entry;
1156 Entry.Node = Argument;
1157 Entry.Ty = (const Type *) Type::Int32Ty;
1158 Args.push_back(Entry);
Dale Johannesen7d2ad622009-01-30 23:10:59 +00001159 // FIXME: is there useful debug info available here?
Dan Gohman475871a2008-07-27 21:46:04 +00001160 std::pair<SDValue, SDValue> CallResult =
Dale Johannesen86098bd2008-09-26 19:31:26 +00001161 LowerCallTo(Chain, (const Type *) Type::Int32Ty, false, false, false, false,
Lauro Ramos Venancio64f4fa52007-04-27 13:54:47 +00001162 CallingConv::C, false,
Dale Johannesen33c960f2009-02-04 20:06:27 +00001163 DAG.getExternalSymbol("__tls_get_addr", PtrVT), Args, DAG, dl);
Lauro Ramos Venancio64f4fa52007-04-27 13:54:47 +00001164 return CallResult.first;
1165}
1166
1167// Lower ISD::GlobalTLSAddress using the "initial exec" or
1168// "local exec" model.
Dan Gohman475871a2008-07-27 21:46:04 +00001169SDValue
Lauro Ramos Venancio64f4fa52007-04-27 13:54:47 +00001170ARMTargetLowering::LowerToTLSExecModels(GlobalAddressSDNode *GA,
Bob Wilson2dc4f542009-03-20 22:42:55 +00001171 SelectionDAG &DAG) {
Lauro Ramos Venancio64f4fa52007-04-27 13:54:47 +00001172 GlobalValue *GV = GA->getGlobal();
Dale Johannesen33c960f2009-02-04 20:06:27 +00001173 DebugLoc dl = GA->getDebugLoc();
Dan Gohman475871a2008-07-27 21:46:04 +00001174 SDValue Offset;
1175 SDValue Chain = DAG.getEntryNode();
Duncan Sands83ec4b62008-06-06 12:08:01 +00001176 MVT PtrVT = getPointerTy();
Lauro Ramos Venancio64f4fa52007-04-27 13:54:47 +00001177 // Get the Thread Pointer
Dale Johannesen33c960f2009-02-04 20:06:27 +00001178 SDValue ThreadPointer = DAG.getNode(ARMISD::THREAD_POINTER, dl, PtrVT);
Lauro Ramos Venancio64f4fa52007-04-27 13:54:47 +00001179
1180 if (GV->isDeclaration()){
1181 // initial exec model
1182 unsigned char PCAdj = Subtarget->isThumb() ? 4 : 8;
1183 ARMConstantPoolValue *CPV =
1184 new ARMConstantPoolValue(GA->getGlobal(), ARMPCLabelIndex, ARMCP::CPValue,
1185 PCAdj, "gottpoff", true);
Evan Cheng1606e8e2009-03-13 07:51:59 +00001186 Offset = DAG.getTargetConstantPool(CPV, PtrVT, 4);
Dale Johannesenb300d2a2009-02-07 00:55:49 +00001187 Offset = DAG.getNode(ARMISD::Wrapper, dl, MVT::i32, Offset);
Dale Johannesen33c960f2009-02-04 20:06:27 +00001188 Offset = DAG.getLoad(PtrVT, dl, Chain, Offset, NULL, 0);
Lauro Ramos Venancio64f4fa52007-04-27 13:54:47 +00001189 Chain = Offset.getValue(1);
1190
Dan Gohman475871a2008-07-27 21:46:04 +00001191 SDValue PICLabel = DAG.getConstant(ARMPCLabelIndex++, MVT::i32);
Dale Johannesen33c960f2009-02-04 20:06:27 +00001192 Offset = DAG.getNode(ARMISD::PIC_ADD, dl, PtrVT, Offset, PICLabel);
Lauro Ramos Venancio64f4fa52007-04-27 13:54:47 +00001193
Dale Johannesen33c960f2009-02-04 20:06:27 +00001194 Offset = DAG.getLoad(PtrVT, dl, Chain, Offset, NULL, 0);
Lauro Ramos Venancio64f4fa52007-04-27 13:54:47 +00001195 } else {
1196 // local exec model
1197 ARMConstantPoolValue *CPV =
1198 new ARMConstantPoolValue(GV, ARMCP::CPValue, "tpoff");
Evan Cheng1606e8e2009-03-13 07:51:59 +00001199 Offset = DAG.getTargetConstantPool(CPV, PtrVT, 4);
Dale Johannesenb300d2a2009-02-07 00:55:49 +00001200 Offset = DAG.getNode(ARMISD::Wrapper, dl, MVT::i32, Offset);
Dale Johannesen33c960f2009-02-04 20:06:27 +00001201 Offset = DAG.getLoad(PtrVT, dl, Chain, Offset, NULL, 0);
Lauro Ramos Venancio64f4fa52007-04-27 13:54:47 +00001202 }
1203
1204 // The address of the thread local variable is the add of the thread
1205 // pointer with the offset of the variable.
Dale Johannesen33c960f2009-02-04 20:06:27 +00001206 return DAG.getNode(ISD::ADD, dl, PtrVT, ThreadPointer, Offset);
Lauro Ramos Venancio64f4fa52007-04-27 13:54:47 +00001207}
1208
Dan Gohman475871a2008-07-27 21:46:04 +00001209SDValue
1210ARMTargetLowering::LowerGlobalTLSAddress(SDValue Op, SelectionDAG &DAG) {
Lauro Ramos Venancio64f4fa52007-04-27 13:54:47 +00001211 // TODO: implement the "local dynamic" model
1212 assert(Subtarget->isTargetELF() &&
1213 "TLS not implemented for non-ELF targets");
1214 GlobalAddressSDNode *GA = cast<GlobalAddressSDNode>(Op);
1215 // If the relocation model is PIC, use the "General Dynamic" TLS Model,
1216 // otherwise use the "Local Exec" TLS Model
1217 if (getTargetMachine().getRelocationModel() == Reloc::PIC_)
1218 return LowerToTLSGeneralDynamicModel(GA, DAG);
1219 else
1220 return LowerToTLSExecModels(GA, DAG);
1221}
1222
Dan Gohman475871a2008-07-27 21:46:04 +00001223SDValue ARMTargetLowering::LowerGlobalAddressELF(SDValue Op,
Bob Wilson2dc4f542009-03-20 22:42:55 +00001224 SelectionDAG &DAG) {
Duncan Sands83ec4b62008-06-06 12:08:01 +00001225 MVT PtrVT = getPointerTy();
Dale Johannesen33c960f2009-02-04 20:06:27 +00001226 DebugLoc dl = Op.getDebugLoc();
Lauro Ramos Venancio0ae4a332007-04-22 00:04:12 +00001227 GlobalValue *GV = cast<GlobalAddressSDNode>(Op)->getGlobal();
1228 Reloc::Model RelocM = getTargetMachine().getRelocationModel();
1229 if (RelocM == Reloc::PIC_) {
Rafael Espindolabb46f522009-01-15 20:18:42 +00001230 bool UseGOTOFF = GV->hasLocalLinkage() || GV->hasHiddenVisibility();
Lauro Ramos Venancio0ae4a332007-04-22 00:04:12 +00001231 ARMConstantPoolValue *CPV =
1232 new ARMConstantPoolValue(GV, ARMCP::CPValue, UseGOTOFF ? "GOTOFF":"GOT");
Evan Cheng1606e8e2009-03-13 07:51:59 +00001233 SDValue CPAddr = DAG.getTargetConstantPool(CPV, PtrVT, 4);
Dale Johannesenb300d2a2009-02-07 00:55:49 +00001234 CPAddr = DAG.getNode(ARMISD::Wrapper, dl, MVT::i32, CPAddr);
Bob Wilson2dc4f542009-03-20 22:42:55 +00001235 SDValue Result = DAG.getLoad(PtrVT, dl, DAG.getEntryNode(),
Dale Johannesen33c960f2009-02-04 20:06:27 +00001236 CPAddr, NULL, 0);
Dan Gohman475871a2008-07-27 21:46:04 +00001237 SDValue Chain = Result.getValue(1);
Dale Johannesenb300d2a2009-02-07 00:55:49 +00001238 SDValue GOT = DAG.getGLOBAL_OFFSET_TABLE(PtrVT);
Dale Johannesen33c960f2009-02-04 20:06:27 +00001239 Result = DAG.getNode(ISD::ADD, dl, PtrVT, Result, GOT);
Lauro Ramos Venancio0ae4a332007-04-22 00:04:12 +00001240 if (!UseGOTOFF)
Dale Johannesen33c960f2009-02-04 20:06:27 +00001241 Result = DAG.getLoad(PtrVT, dl, Chain, Result, NULL, 0);
Lauro Ramos Venancio0ae4a332007-04-22 00:04:12 +00001242 return Result;
1243 } else {
Evan Cheng1606e8e2009-03-13 07:51:59 +00001244 SDValue CPAddr = DAG.getTargetConstantPool(GV, PtrVT, 4);
Dale Johannesenb300d2a2009-02-07 00:55:49 +00001245 CPAddr = DAG.getNode(ARMISD::Wrapper, dl, MVT::i32, CPAddr);
Dale Johannesen33c960f2009-02-04 20:06:27 +00001246 return DAG.getLoad(PtrVT, dl, DAG.getEntryNode(), CPAddr, NULL, 0);
Lauro Ramos Venancio0ae4a332007-04-22 00:04:12 +00001247 }
1248}
1249
Evan Chenga8e29892007-01-19 07:51:42 +00001250/// GVIsIndirectSymbol - true if the GV will be accessed via an indirect symbol
Evan Cheng97c9bb52007-05-04 00:26:58 +00001251/// even in non-static mode.
1252static bool GVIsIndirectSymbol(GlobalValue *GV, Reloc::Model RelocM) {
Evan Chengae94e592008-12-05 01:06:39 +00001253 // If symbol visibility is hidden, the extra load is not needed if
1254 // the symbol is definitely defined in the current translation unit.
1255 bool isDecl = GV->isDeclaration() && !GV->hasNotBeenReadFromBitcode();
1256 if (GV->hasHiddenVisibility() && (!isDecl && !GV->hasCommonLinkage()))
1257 return false;
Duncan Sands667d4b82009-03-07 15:45:40 +00001258 return RelocM != Reloc::Static && (isDecl || GV->isWeakForLinker());
Evan Chenga8e29892007-01-19 07:51:42 +00001259}
1260
Dan Gohman475871a2008-07-27 21:46:04 +00001261SDValue ARMTargetLowering::LowerGlobalAddressDarwin(SDValue Op,
Bob Wilson2dc4f542009-03-20 22:42:55 +00001262 SelectionDAG &DAG) {
Duncan Sands83ec4b62008-06-06 12:08:01 +00001263 MVT PtrVT = getPointerTy();
Dale Johannesen33c960f2009-02-04 20:06:27 +00001264 DebugLoc dl = Op.getDebugLoc();
Evan Chenga8e29892007-01-19 07:51:42 +00001265 GlobalValue *GV = cast<GlobalAddressSDNode>(Op)->getGlobal();
1266 Reloc::Model RelocM = getTargetMachine().getRelocationModel();
Evan Cheng97c9bb52007-05-04 00:26:58 +00001267 bool IsIndirect = GVIsIndirectSymbol(GV, RelocM);
Dan Gohman475871a2008-07-27 21:46:04 +00001268 SDValue CPAddr;
Evan Chenga8e29892007-01-19 07:51:42 +00001269 if (RelocM == Reloc::Static)
Evan Cheng1606e8e2009-03-13 07:51:59 +00001270 CPAddr = DAG.getTargetConstantPool(GV, PtrVT, 4);
Evan Chenga8e29892007-01-19 07:51:42 +00001271 else {
1272 unsigned PCAdj = (RelocM != Reloc::PIC_)
1273 ? 0 : (Subtarget->isThumb() ? 4 : 8);
Evan Chengc60e76d2007-01-30 20:37:08 +00001274 ARMCP::ARMCPKind Kind = IsIndirect ? ARMCP::CPNonLazyPtr
1275 : ARMCP::CPValue;
Evan Chenga8e29892007-01-19 07:51:42 +00001276 ARMConstantPoolValue *CPV = new ARMConstantPoolValue(GV, ARMPCLabelIndex,
Evan Chengc60e76d2007-01-30 20:37:08 +00001277 Kind, PCAdj);
Evan Cheng1606e8e2009-03-13 07:51:59 +00001278 CPAddr = DAG.getTargetConstantPool(CPV, PtrVT, 4);
Evan Chenga8e29892007-01-19 07:51:42 +00001279 }
Dale Johannesenb300d2a2009-02-07 00:55:49 +00001280 CPAddr = DAG.getNode(ARMISD::Wrapper, dl, MVT::i32, CPAddr);
Evan Chenga8e29892007-01-19 07:51:42 +00001281
Dale Johannesen33c960f2009-02-04 20:06:27 +00001282 SDValue Result = DAG.getLoad(PtrVT, dl, DAG.getEntryNode(), CPAddr, NULL, 0);
Dan Gohman475871a2008-07-27 21:46:04 +00001283 SDValue Chain = Result.getValue(1);
Evan Chenga8e29892007-01-19 07:51:42 +00001284
1285 if (RelocM == Reloc::PIC_) {
Dan Gohman475871a2008-07-27 21:46:04 +00001286 SDValue PICLabel = DAG.getConstant(ARMPCLabelIndex++, MVT::i32);
Dale Johannesen33c960f2009-02-04 20:06:27 +00001287 Result = DAG.getNode(ARMISD::PIC_ADD, dl, PtrVT, Result, PICLabel);
Evan Chenga8e29892007-01-19 07:51:42 +00001288 }
1289 if (IsIndirect)
Dale Johannesen33c960f2009-02-04 20:06:27 +00001290 Result = DAG.getLoad(PtrVT, dl, Chain, Result, NULL, 0);
Evan Chenga8e29892007-01-19 07:51:42 +00001291
1292 return Result;
1293}
1294
Dan Gohman475871a2008-07-27 21:46:04 +00001295SDValue ARMTargetLowering::LowerGLOBAL_OFFSET_TABLE(SDValue Op,
Bob Wilson2dc4f542009-03-20 22:42:55 +00001296 SelectionDAG &DAG){
Lauro Ramos Venancio0ae4a332007-04-22 00:04:12 +00001297 assert(Subtarget->isTargetELF() &&
1298 "GLOBAL OFFSET TABLE not implemented for non-ELF targets");
Duncan Sands83ec4b62008-06-06 12:08:01 +00001299 MVT PtrVT = getPointerTy();
Dale Johannesen33c960f2009-02-04 20:06:27 +00001300 DebugLoc dl = Op.getDebugLoc();
Lauro Ramos Venancio0ae4a332007-04-22 00:04:12 +00001301 unsigned PCAdj = Subtarget->isThumb() ? 4 : 8;
1302 ARMConstantPoolValue *CPV = new ARMConstantPoolValue("_GLOBAL_OFFSET_TABLE_",
1303 ARMPCLabelIndex,
1304 ARMCP::CPValue, PCAdj);
Evan Cheng1606e8e2009-03-13 07:51:59 +00001305 SDValue CPAddr = DAG.getTargetConstantPool(CPV, PtrVT, 4);
Dale Johannesenb300d2a2009-02-07 00:55:49 +00001306 CPAddr = DAG.getNode(ARMISD::Wrapper, dl, MVT::i32, CPAddr);
Dale Johannesen33c960f2009-02-04 20:06:27 +00001307 SDValue Result = DAG.getLoad(PtrVT, dl, DAG.getEntryNode(), CPAddr, NULL, 0);
Dan Gohman475871a2008-07-27 21:46:04 +00001308 SDValue PICLabel = DAG.getConstant(ARMPCLabelIndex++, MVT::i32);
Dale Johannesen33c960f2009-02-04 20:06:27 +00001309 return DAG.getNode(ARMISD::PIC_ADD, dl, PtrVT, Result, PICLabel);
Lauro Ramos Venancio0ae4a332007-04-22 00:04:12 +00001310}
1311
Jim Grosbach0e0da732009-05-12 23:59:14 +00001312SDValue
1313ARMTargetLowering::LowerINTRINSIC_WO_CHAIN(SDValue Op, SelectionDAG &DAG) {
Duncan Sands83ec4b62008-06-06 12:08:01 +00001314 MVT PtrVT = DAG.getTargetLoweringInfo().getPointerTy();
Dan Gohmanf5aeb1a2008-09-12 16:56:44 +00001315 unsigned IntNo = cast<ConstantSDNode>(Op.getOperand(0))->getZExtValue();
Jim Grosbach0e0da732009-05-12 23:59:14 +00001316 DebugLoc dl = Op.getDebugLoc();
Lauro Ramos Venancioe0cb36b2007-11-08 17:20:05 +00001317 switch (IntNo) {
Dan Gohman475871a2008-07-27 21:46:04 +00001318 default: return SDValue(); // Don't custom lower most intrinsics.
Lauro Ramos Venancioe0cb36b2007-11-08 17:20:05 +00001319 case Intrinsic::arm_thread_pointer:
Jim Grosbach0e0da732009-05-12 23:59:14 +00001320 return DAG.getNode(ARMISD::THREAD_POINTER, dl, PtrVT);
Jim Grosbachf9570122009-05-14 00:46:35 +00001321 case Intrinsic::eh_sjlj_setjmp:
1322 SDValue Res = DAG.getNode(ARMISD::EH_SJLJ_SETJMP, dl, MVT::i32,
Jim Grosbach0e0da732009-05-12 23:59:14 +00001323 Op.getOperand(1));
1324 return Res;
Lauro Ramos Venancioe0cb36b2007-11-08 17:20:05 +00001325 }
1326}
1327
Dan Gohman475871a2008-07-27 21:46:04 +00001328static SDValue LowerVASTART(SDValue Op, SelectionDAG &DAG,
Bob Wilson2dc4f542009-03-20 22:42:55 +00001329 unsigned VarArgsFrameIndex) {
Evan Chenga8e29892007-01-19 07:51:42 +00001330 // vastart just stores the address of the VarArgsFrameIndex slot into the
1331 // memory location argument.
Dale Johannesen33c960f2009-02-04 20:06:27 +00001332 DebugLoc dl = Op.getDebugLoc();
Duncan Sands83ec4b62008-06-06 12:08:01 +00001333 MVT PtrVT = DAG.getTargetLoweringInfo().getPointerTy();
Dan Gohman475871a2008-07-27 21:46:04 +00001334 SDValue FR = DAG.getFrameIndex(VarArgsFrameIndex, PtrVT);
Dan Gohman69de1932008-02-06 22:27:42 +00001335 const Value *SV = cast<SrcValueSDNode>(Op.getOperand(2))->getValue();
Dale Johannesen33c960f2009-02-04 20:06:27 +00001336 return DAG.getStore(Op.getOperand(0), dl, FR, Op.getOperand(1), SV, 0);
Evan Chenga8e29892007-01-19 07:51:42 +00001337}
1338
Dan Gohman475871a2008-07-27 21:46:04 +00001339SDValue
Bob Wilson5bafff32009-06-22 23:27:02 +00001340ARMTargetLowering::GetF64FormalArgument(CCValAssign &VA, CCValAssign &NextVA,
1341 SDValue &Root, SelectionDAG &DAG,
1342 DebugLoc dl) {
1343 MachineFunction &MF = DAG.getMachineFunction();
1344 ARMFunctionInfo *AFI = MF.getInfo<ARMFunctionInfo>();
1345
1346 TargetRegisterClass *RC;
1347 if (AFI->isThumbFunction())
1348 RC = ARM::tGPRRegisterClass;
1349 else
1350 RC = ARM::GPRRegisterClass;
1351
1352 // Transform the arguments stored in physical registers into virtual ones.
1353 unsigned Reg = MF.addLiveIn(VA.getLocReg(), RC);
1354 SDValue ArgValue = DAG.getCopyFromReg(Root, dl, Reg, MVT::i32);
1355
1356 SDValue ArgValue2;
1357 if (NextVA.isMemLoc()) {
1358 unsigned ArgSize = NextVA.getLocVT().getSizeInBits()/8;
1359 MachineFrameInfo *MFI = MF.getFrameInfo();
1360 int FI = MFI->CreateFixedObject(ArgSize, NextVA.getLocMemOffset());
1361
1362 // Create load node to retrieve arguments from the stack.
1363 SDValue FIN = DAG.getFrameIndex(FI, getPointerTy());
1364 ArgValue2 = DAG.getLoad(MVT::i32, dl, Root, FIN, NULL, 0);
1365 } else {
1366 Reg = MF.addLiveIn(NextVA.getLocReg(), RC);
1367 ArgValue2 = DAG.getCopyFromReg(Root, dl, Reg, MVT::i32);
1368 }
1369
1370 return DAG.getNode(ARMISD::FMDRR, dl, MVT::f64, ArgValue, ArgValue2);
1371}
1372
1373SDValue
Dan Gohman475871a2008-07-27 21:46:04 +00001374ARMTargetLowering::LowerFORMAL_ARGUMENTS(SDValue Op, SelectionDAG &DAG) {
Bob Wilson1f595bb2009-04-17 19:07:39 +00001375 MachineFunction &MF = DAG.getMachineFunction();
1376 MachineFrameInfo *MFI = MF.getFrameInfo();
1377
Dan Gohman475871a2008-07-27 21:46:04 +00001378 SDValue Root = Op.getOperand(0);
Dale Johannesen33c960f2009-02-04 20:06:27 +00001379 DebugLoc dl = Op.getDebugLoc();
Dan Gohmanf5aeb1a2008-09-12 16:56:44 +00001380 bool isVarArg = cast<ConstantSDNode>(Op.getOperand(2))->getZExtValue() != 0;
Bob Wilson1f595bb2009-04-17 19:07:39 +00001381 unsigned CC = MF.getFunction()->getCallingConv();
1382 ARMFunctionInfo *AFI = MF.getInfo<ARMFunctionInfo>();
1383
1384 // Assign locations to all of the incoming arguments.
1385 SmallVector<CCValAssign, 16> ArgLocs;
1386 CCState CCInfo(CC, isVarArg, getTargetMachine(), ArgLocs);
Anton Korobeynikov385f5a92009-06-16 18:50:49 +00001387 CCInfo.AnalyzeFormalArguments(Op.getNode(),
1388 CCAssignFnForNode(CC, /* Return*/ false));
Bob Wilson1f595bb2009-04-17 19:07:39 +00001389
1390 SmallVector<SDValue, 16> ArgValues;
1391
1392 for (unsigned i = 0, e = ArgLocs.size(); i != e; ++i) {
1393 CCValAssign &VA = ArgLocs[i];
1394
Bob Wilsondee46d72009-04-17 20:35:10 +00001395 // Arguments stored in registers.
Bob Wilson1f595bb2009-04-17 19:07:39 +00001396 if (VA.isRegLoc()) {
1397 MVT RegVT = VA.getLocVT();
Bob Wilson1f595bb2009-04-17 19:07:39 +00001398
Bob Wilson5bafff32009-06-22 23:27:02 +00001399 SDValue ArgValue;
Bob Wilson1f595bb2009-04-17 19:07:39 +00001400 if (VA.needsCustom()) {
Bob Wilson5bafff32009-06-22 23:27:02 +00001401 // f64 and vector types are split up into multiple registers or
1402 // combinations of registers and stack slots.
1403 RegVT = MVT::i32;
Bob Wilson1f595bb2009-04-17 19:07:39 +00001404
Bob Wilson5bafff32009-06-22 23:27:02 +00001405 if (VA.getLocVT() == MVT::v2f64) {
1406 SDValue ArgValue1 = GetF64FormalArgument(VA, ArgLocs[++i],
1407 Root, DAG, dl);
1408 VA = ArgLocs[++i]; // skip ahead to next loc
1409 SDValue ArgValue2 = GetF64FormalArgument(VA, ArgLocs[++i],
1410 Root, DAG, dl);
1411 ArgValue = DAG.getNode(ISD::UNDEF, dl, MVT::v2f64);
1412 ArgValue = DAG.getNode(ISD::INSERT_VECTOR_ELT, dl, MVT::v2f64,
1413 ArgValue, ArgValue1, DAG.getIntPtrConstant(0));
1414 ArgValue = DAG.getNode(ISD::INSERT_VECTOR_ELT, dl, MVT::v2f64,
1415 ArgValue, ArgValue2, DAG.getIntPtrConstant(1));
1416 } else
1417 ArgValue = GetF64FormalArgument(VA, ArgLocs[++i], Root, DAG, dl);
Bob Wilson1f595bb2009-04-17 19:07:39 +00001418
Bob Wilson5bafff32009-06-22 23:27:02 +00001419 } else {
1420 TargetRegisterClass *RC;
1421 if (FloatABIType == FloatABI::Hard && RegVT == MVT::f32)
1422 RC = ARM::SPRRegisterClass;
1423 else if (FloatABIType == FloatABI::Hard && RegVT == MVT::f64)
1424 RC = ARM::DPRRegisterClass;
1425 else if (AFI->isThumbFunction())
1426 RC = ARM::tGPRRegisterClass;
1427 else
1428 RC = ARM::GPRRegisterClass;
Bob Wilson1f595bb2009-04-17 19:07:39 +00001429
Bob Wilson5bafff32009-06-22 23:27:02 +00001430 assert((RegVT == MVT::i32 || RegVT == MVT::f32 ||
1431 (FloatABIType == FloatABI::Hard && RegVT == MVT::f64)) &&
1432 "RegVT not supported by FORMAL_ARGUMENTS Lowering");
1433
1434 // Transform the arguments in physical registers into virtual ones.
1435 unsigned Reg = MF.addLiveIn(VA.getLocReg(), RC);
1436 ArgValue = DAG.getCopyFromReg(Root, dl, Reg, RegVT);
Bob Wilson1f595bb2009-04-17 19:07:39 +00001437 }
1438
1439 // If this is an 8 or 16-bit value, it is really passed promoted
1440 // to 32 bits. Insert an assert[sz]ext to capture this, then
1441 // truncate to the right size.
1442 switch (VA.getLocInfo()) {
1443 default: assert(0 && "Unknown loc info!");
1444 case CCValAssign::Full: break;
1445 case CCValAssign::BCvt:
1446 ArgValue = DAG.getNode(ISD::BIT_CONVERT, dl, VA.getValVT(), ArgValue);
1447 break;
1448 case CCValAssign::SExt:
1449 ArgValue = DAG.getNode(ISD::AssertSext, dl, RegVT, ArgValue,
1450 DAG.getValueType(VA.getValVT()));
1451 ArgValue = DAG.getNode(ISD::TRUNCATE, dl, VA.getValVT(), ArgValue);
1452 break;
1453 case CCValAssign::ZExt:
1454 ArgValue = DAG.getNode(ISD::AssertZext, dl, RegVT, ArgValue,
1455 DAG.getValueType(VA.getValVT()));
1456 ArgValue = DAG.getNode(ISD::TRUNCATE, dl, VA.getValVT(), ArgValue);
1457 break;
1458 }
1459
1460 ArgValues.push_back(ArgValue);
1461
1462 } else { // VA.isRegLoc()
1463
1464 // sanity check
1465 assert(VA.isMemLoc());
1466 assert(VA.getValVT() != MVT::i64 && "i64 should already be lowered");
1467
1468 unsigned ArgSize = VA.getLocVT().getSizeInBits()/8;
1469 int FI = MFI->CreateFixedObject(ArgSize, VA.getLocMemOffset());
1470
Bob Wilsondee46d72009-04-17 20:35:10 +00001471 // Create load nodes to retrieve arguments from the stack.
Bob Wilson1f595bb2009-04-17 19:07:39 +00001472 SDValue FIN = DAG.getFrameIndex(FI, getPointerTy());
1473 ArgValues.push_back(DAG.getLoad(VA.getValVT(), dl, Root, FIN, NULL, 0));
1474 }
1475 }
1476
1477 // varargs
Evan Chenga8e29892007-01-19 07:51:42 +00001478 if (isVarArg) {
1479 static const unsigned GPRArgRegs[] = {
1480 ARM::R0, ARM::R1, ARM::R2, ARM::R3
1481 };
1482
Bob Wilsondee46d72009-04-17 20:35:10 +00001483 unsigned NumGPRs = CCInfo.getFirstUnallocated
1484 (GPRArgRegs, sizeof(GPRArgRegs) / sizeof(GPRArgRegs[0]));
Bob Wilson1f595bb2009-04-17 19:07:39 +00001485
Lauro Ramos Venancio600c3832007-02-23 20:32:57 +00001486 unsigned Align = MF.getTarget().getFrameInfo()->getStackAlignment();
1487 unsigned VARegSize = (4 - NumGPRs) * 4;
1488 unsigned VARegSaveSize = (VARegSize + Align - 1) & ~(Align - 1);
Bob Wilson1f595bb2009-04-17 19:07:39 +00001489 unsigned ArgOffset = 0;
Evan Chenga8e29892007-01-19 07:51:42 +00001490 if (VARegSaveSize) {
1491 // If this function is vararg, store any remaining integer argument regs
1492 // to their spots on the stack so that they may be loaded by deferencing
1493 // the result of va_next.
1494 AFI->setVarArgsRegSaveSize(VARegSaveSize);
Bob Wilson1f595bb2009-04-17 19:07:39 +00001495 ArgOffset = CCInfo.getNextStackOffset();
Lauro Ramos Venancio600c3832007-02-23 20:32:57 +00001496 VarArgsFrameIndex = MFI->CreateFixedObject(VARegSaveSize, ArgOffset +
1497 VARegSaveSize - VARegSize);
Dan Gohman475871a2008-07-27 21:46:04 +00001498 SDValue FIN = DAG.getFrameIndex(VarArgsFrameIndex, getPointerTy());
Evan Chenga8e29892007-01-19 07:51:42 +00001499
Dan Gohman475871a2008-07-27 21:46:04 +00001500 SmallVector<SDValue, 4> MemOps;
Evan Chenga8e29892007-01-19 07:51:42 +00001501 for (; NumGPRs < 4; ++NumGPRs) {
Bob Wilson1f595bb2009-04-17 19:07:39 +00001502 TargetRegisterClass *RC;
Jim Grosbach30eae3c2009-04-07 20:34:09 +00001503 if (AFI->isThumbFunction())
Bob Wilson1f595bb2009-04-17 19:07:39 +00001504 RC = ARM::tGPRRegisterClass;
Jim Grosbach30eae3c2009-04-07 20:34:09 +00001505 else
Bob Wilson1f595bb2009-04-17 19:07:39 +00001506 RC = ARM::GPRRegisterClass;
1507
Bob Wilson998e1252009-04-20 18:36:57 +00001508 unsigned VReg = MF.addLiveIn(GPRArgRegs[NumGPRs], RC);
Dale Johannesen33c960f2009-02-04 20:06:27 +00001509 SDValue Val = DAG.getCopyFromReg(Root, dl, VReg, MVT::i32);
1510 SDValue Store = DAG.getStore(Val.getValue(1), dl, Val, FIN, NULL, 0);
Evan Chenga8e29892007-01-19 07:51:42 +00001511 MemOps.push_back(Store);
Dale Johannesen33c960f2009-02-04 20:06:27 +00001512 FIN = DAG.getNode(ISD::ADD, dl, getPointerTy(), FIN,
Evan Chenga8e29892007-01-19 07:51:42 +00001513 DAG.getConstant(4, getPointerTy()));
1514 }
1515 if (!MemOps.empty())
Dale Johannesen33c960f2009-02-04 20:06:27 +00001516 Root = DAG.getNode(ISD::TokenFactor, dl, MVT::Other,
Evan Chenga8e29892007-01-19 07:51:42 +00001517 &MemOps[0], MemOps.size());
1518 } else
1519 // This will point to the next argument passed via stack.
1520 VarArgsFrameIndex = MFI->CreateFixedObject(4, ArgOffset);
1521 }
1522
1523 ArgValues.push_back(Root);
1524
1525 // Return the new list of results.
Dale Johannesen33c960f2009-02-04 20:06:27 +00001526 return DAG.getNode(ISD::MERGE_VALUES, dl, Op.getNode()->getVTList(),
Bob Wilson1f595bb2009-04-17 19:07:39 +00001527 &ArgValues[0], ArgValues.size()).getValue(Op.getResNo());
Evan Chenga8e29892007-01-19 07:51:42 +00001528}
1529
1530/// isFloatingPointZero - Return true if this is +0.0.
Dan Gohman475871a2008-07-27 21:46:04 +00001531static bool isFloatingPointZero(SDValue Op) {
Evan Chenga8e29892007-01-19 07:51:42 +00001532 if (ConstantFPSDNode *CFP = dyn_cast<ConstantFPSDNode>(Op))
Dale Johanneseneaf08942007-08-31 04:03:46 +00001533 return CFP->getValueAPF().isPosZero();
Gabor Greifba36cb52008-08-28 21:40:38 +00001534 else if (ISD::isEXTLoad(Op.getNode()) || ISD::isNON_EXTLoad(Op.getNode())) {
Evan Chenga8e29892007-01-19 07:51:42 +00001535 // Maybe this has already been legalized into the constant pool?
1536 if (Op.getOperand(1).getOpcode() == ARMISD::Wrapper) {
Dan Gohman475871a2008-07-27 21:46:04 +00001537 SDValue WrapperOp = Op.getOperand(1).getOperand(0);
Evan Chenga8e29892007-01-19 07:51:42 +00001538 if (ConstantPoolSDNode *CP = dyn_cast<ConstantPoolSDNode>(WrapperOp))
1539 if (ConstantFP *CFP = dyn_cast<ConstantFP>(CP->getConstVal()))
Dale Johanneseneaf08942007-08-31 04:03:46 +00001540 return CFP->getValueAPF().isPosZero();
Evan Chenga8e29892007-01-19 07:51:42 +00001541 }
1542 }
1543 return false;
1544}
1545
Evan Cheng9a2ef952007-02-02 01:53:26 +00001546static bool isLegalCmpImmediate(unsigned C, bool isThumb) {
Evan Chenga8e29892007-01-19 07:51:42 +00001547 return ( isThumb && (C & ~255U) == 0) ||
1548 (!isThumb && ARM_AM::getSOImmVal(C) != -1);
1549}
1550
1551/// Returns appropriate ARM CMP (cmp) and corresponding condition code for
1552/// the given operands.
Dan Gohman475871a2008-07-27 21:46:04 +00001553static SDValue getARMCmp(SDValue LHS, SDValue RHS, ISD::CondCode CC,
Dale Johannesende064702009-02-06 21:50:26 +00001554 SDValue &ARMCC, SelectionDAG &DAG, bool isThumb,
1555 DebugLoc dl) {
Gabor Greifba36cb52008-08-28 21:40:38 +00001556 if (ConstantSDNode *RHSC = dyn_cast<ConstantSDNode>(RHS.getNode())) {
Dan Gohmanf5aeb1a2008-09-12 16:56:44 +00001557 unsigned C = RHSC->getZExtValue();
Evan Chenga8e29892007-01-19 07:51:42 +00001558 if (!isLegalCmpImmediate(C, isThumb)) {
1559 // Constant does not fit, try adjusting it by one?
1560 switch (CC) {
1561 default: break;
1562 case ISD::SETLT:
Evan Chenga8e29892007-01-19 07:51:42 +00001563 case ISD::SETGE:
Evan Chenga8e29892007-01-19 07:51:42 +00001564 if (isLegalCmpImmediate(C-1, isThumb)) {
Evan Cheng9a2ef952007-02-02 01:53:26 +00001565 CC = (CC == ISD::SETLT) ? ISD::SETLE : ISD::SETGT;
1566 RHS = DAG.getConstant(C-1, MVT::i32);
1567 }
1568 break;
1569 case ISD::SETULT:
1570 case ISD::SETUGE:
1571 if (C > 0 && isLegalCmpImmediate(C-1, isThumb)) {
1572 CC = (CC == ISD::SETULT) ? ISD::SETULE : ISD::SETUGT;
Evan Chenga8e29892007-01-19 07:51:42 +00001573 RHS = DAG.getConstant(C-1, MVT::i32);
1574 }
1575 break;
1576 case ISD::SETLE:
Evan Chenga8e29892007-01-19 07:51:42 +00001577 case ISD::SETGT:
Evan Chenga8e29892007-01-19 07:51:42 +00001578 if (isLegalCmpImmediate(C+1, isThumb)) {
Evan Cheng9a2ef952007-02-02 01:53:26 +00001579 CC = (CC == ISD::SETLE) ? ISD::SETLT : ISD::SETGE;
1580 RHS = DAG.getConstant(C+1, MVT::i32);
1581 }
1582 break;
1583 case ISD::SETULE:
1584 case ISD::SETUGT:
1585 if (C < 0xffffffff && isLegalCmpImmediate(C+1, isThumb)) {
1586 CC = (CC == ISD::SETULE) ? ISD::SETULT : ISD::SETUGE;
Evan Chenga8e29892007-01-19 07:51:42 +00001587 RHS = DAG.getConstant(C+1, MVT::i32);
1588 }
1589 break;
1590 }
1591 }
1592 }
1593
1594 ARMCC::CondCodes CondCode = IntCCToARMCC(CC);
Lauro Ramos Venancio99966632007-04-02 01:30:03 +00001595 ARMISD::NodeType CompareType;
1596 switch (CondCode) {
1597 default:
1598 CompareType = ARMISD::CMP;
1599 break;
1600 case ARMCC::EQ:
1601 case ARMCC::NE:
David Goodwinc0309b42009-06-29 15:33:01 +00001602 // Uses only Z Flag
1603 CompareType = ARMISD::CMPZ;
Lauro Ramos Venancio99966632007-04-02 01:30:03 +00001604 break;
1605 }
Evan Chenga8e29892007-01-19 07:51:42 +00001606 ARMCC = DAG.getConstant(CondCode, MVT::i32);
Dale Johannesende064702009-02-06 21:50:26 +00001607 return DAG.getNode(CompareType, dl, MVT::Flag, LHS, RHS);
Evan Chenga8e29892007-01-19 07:51:42 +00001608}
1609
1610/// Returns a appropriate VFP CMP (fcmp{s|d}+fmstat) for the given operands.
Bob Wilson2dc4f542009-03-20 22:42:55 +00001611static SDValue getVFPCmp(SDValue LHS, SDValue RHS, SelectionDAG &DAG,
Dale Johannesende064702009-02-06 21:50:26 +00001612 DebugLoc dl) {
Dan Gohman475871a2008-07-27 21:46:04 +00001613 SDValue Cmp;
Evan Chenga8e29892007-01-19 07:51:42 +00001614 if (!isFloatingPointZero(RHS))
Dale Johannesende064702009-02-06 21:50:26 +00001615 Cmp = DAG.getNode(ARMISD::CMPFP, dl, MVT::Flag, LHS, RHS);
Evan Chenga8e29892007-01-19 07:51:42 +00001616 else
Dale Johannesende064702009-02-06 21:50:26 +00001617 Cmp = DAG.getNode(ARMISD::CMPFPw0, dl, MVT::Flag, LHS);
1618 return DAG.getNode(ARMISD::FMSTAT, dl, MVT::Flag, Cmp);
Evan Chenga8e29892007-01-19 07:51:42 +00001619}
1620
Dan Gohman475871a2008-07-27 21:46:04 +00001621static SDValue LowerSELECT_CC(SDValue Op, SelectionDAG &DAG,
Bob Wilson2dc4f542009-03-20 22:42:55 +00001622 const ARMSubtarget *ST) {
Duncan Sands83ec4b62008-06-06 12:08:01 +00001623 MVT VT = Op.getValueType();
Dan Gohman475871a2008-07-27 21:46:04 +00001624 SDValue LHS = Op.getOperand(0);
1625 SDValue RHS = Op.getOperand(1);
Evan Chenga8e29892007-01-19 07:51:42 +00001626 ISD::CondCode CC = cast<CondCodeSDNode>(Op.getOperand(4))->get();
Dan Gohman475871a2008-07-27 21:46:04 +00001627 SDValue TrueVal = Op.getOperand(2);
1628 SDValue FalseVal = Op.getOperand(3);
Dale Johannesende064702009-02-06 21:50:26 +00001629 DebugLoc dl = Op.getDebugLoc();
Evan Chenga8e29892007-01-19 07:51:42 +00001630
1631 if (LHS.getValueType() == MVT::i32) {
Dan Gohman475871a2008-07-27 21:46:04 +00001632 SDValue ARMCC;
1633 SDValue CCR = DAG.getRegister(ARM::CPSR, MVT::i32);
Dale Johannesende064702009-02-06 21:50:26 +00001634 SDValue Cmp = getARMCmp(LHS, RHS, CC, ARMCC, DAG, ST->isThumb(), dl);
1635 return DAG.getNode(ARMISD::CMOV, dl, VT, FalseVal, TrueVal, ARMCC, CCR,Cmp);
Evan Chenga8e29892007-01-19 07:51:42 +00001636 }
1637
1638 ARMCC::CondCodes CondCode, CondCode2;
1639 if (FPCCToARMCC(CC, CondCode, CondCode2))
1640 std::swap(TrueVal, FalseVal);
1641
Dan Gohman475871a2008-07-27 21:46:04 +00001642 SDValue ARMCC = DAG.getConstant(CondCode, MVT::i32);
1643 SDValue CCR = DAG.getRegister(ARM::CPSR, MVT::i32);
Dale Johannesende064702009-02-06 21:50:26 +00001644 SDValue Cmp = getVFPCmp(LHS, RHS, DAG, dl);
1645 SDValue Result = DAG.getNode(ARMISD::CMOV, dl, VT, FalseVal, TrueVal,
Evan Cheng0e1d3792007-07-05 07:18:20 +00001646 ARMCC, CCR, Cmp);
Evan Chenga8e29892007-01-19 07:51:42 +00001647 if (CondCode2 != ARMCC::AL) {
Dan Gohman475871a2008-07-27 21:46:04 +00001648 SDValue ARMCC2 = DAG.getConstant(CondCode2, MVT::i32);
Evan Chenga8e29892007-01-19 07:51:42 +00001649 // FIXME: Needs another CMP because flag can have but one use.
Dale Johannesende064702009-02-06 21:50:26 +00001650 SDValue Cmp2 = getVFPCmp(LHS, RHS, DAG, dl);
Bob Wilson2dc4f542009-03-20 22:42:55 +00001651 Result = DAG.getNode(ARMISD::CMOV, dl, VT,
Dale Johannesende064702009-02-06 21:50:26 +00001652 Result, TrueVal, ARMCC2, CCR, Cmp2);
Evan Chenga8e29892007-01-19 07:51:42 +00001653 }
1654 return Result;
1655}
1656
Dan Gohman475871a2008-07-27 21:46:04 +00001657static SDValue LowerBR_CC(SDValue Op, SelectionDAG &DAG,
Bob Wilson2dc4f542009-03-20 22:42:55 +00001658 const ARMSubtarget *ST) {
Dan Gohman475871a2008-07-27 21:46:04 +00001659 SDValue Chain = Op.getOperand(0);
Evan Chenga8e29892007-01-19 07:51:42 +00001660 ISD::CondCode CC = cast<CondCodeSDNode>(Op.getOperand(1))->get();
Dan Gohman475871a2008-07-27 21:46:04 +00001661 SDValue LHS = Op.getOperand(2);
1662 SDValue RHS = Op.getOperand(3);
1663 SDValue Dest = Op.getOperand(4);
Dale Johannesende064702009-02-06 21:50:26 +00001664 DebugLoc dl = Op.getDebugLoc();
Evan Chenga8e29892007-01-19 07:51:42 +00001665
1666 if (LHS.getValueType() == MVT::i32) {
Dan Gohman475871a2008-07-27 21:46:04 +00001667 SDValue ARMCC;
1668 SDValue CCR = DAG.getRegister(ARM::CPSR, MVT::i32);
Dale Johannesende064702009-02-06 21:50:26 +00001669 SDValue Cmp = getARMCmp(LHS, RHS, CC, ARMCC, DAG, ST->isThumb(), dl);
Bob Wilson2dc4f542009-03-20 22:42:55 +00001670 return DAG.getNode(ARMISD::BRCOND, dl, MVT::Other,
Dale Johannesende064702009-02-06 21:50:26 +00001671 Chain, Dest, ARMCC, CCR,Cmp);
Evan Chenga8e29892007-01-19 07:51:42 +00001672 }
1673
1674 assert(LHS.getValueType() == MVT::f32 || LHS.getValueType() == MVT::f64);
1675 ARMCC::CondCodes CondCode, CondCode2;
1676 if (FPCCToARMCC(CC, CondCode, CondCode2))
1677 // Swap the LHS/RHS of the comparison if needed.
1678 std::swap(LHS, RHS);
Bob Wilson2dc4f542009-03-20 22:42:55 +00001679
Dale Johannesende064702009-02-06 21:50:26 +00001680 SDValue Cmp = getVFPCmp(LHS, RHS, DAG, dl);
Dan Gohman475871a2008-07-27 21:46:04 +00001681 SDValue ARMCC = DAG.getConstant(CondCode, MVT::i32);
1682 SDValue CCR = DAG.getRegister(ARM::CPSR, MVT::i32);
Evan Chenga8e29892007-01-19 07:51:42 +00001683 SDVTList VTList = DAG.getVTList(MVT::Other, MVT::Flag);
Dan Gohman475871a2008-07-27 21:46:04 +00001684 SDValue Ops[] = { Chain, Dest, ARMCC, CCR, Cmp };
Dale Johannesende064702009-02-06 21:50:26 +00001685 SDValue Res = DAG.getNode(ARMISD::BRCOND, dl, VTList, Ops, 5);
Evan Chenga8e29892007-01-19 07:51:42 +00001686 if (CondCode2 != ARMCC::AL) {
1687 ARMCC = DAG.getConstant(CondCode2, MVT::i32);
Dan Gohman475871a2008-07-27 21:46:04 +00001688 SDValue Ops[] = { Res, Dest, ARMCC, CCR, Res.getValue(1) };
Dale Johannesende064702009-02-06 21:50:26 +00001689 Res = DAG.getNode(ARMISD::BRCOND, dl, VTList, Ops, 5);
Evan Chenga8e29892007-01-19 07:51:42 +00001690 }
1691 return Res;
1692}
1693
Dan Gohman475871a2008-07-27 21:46:04 +00001694SDValue ARMTargetLowering::LowerBR_JT(SDValue Op, SelectionDAG &DAG) {
1695 SDValue Chain = Op.getOperand(0);
1696 SDValue Table = Op.getOperand(1);
1697 SDValue Index = Op.getOperand(2);
Dale Johannesen33c960f2009-02-04 20:06:27 +00001698 DebugLoc dl = Op.getDebugLoc();
Evan Chenga8e29892007-01-19 07:51:42 +00001699
Duncan Sands83ec4b62008-06-06 12:08:01 +00001700 MVT PTy = getPointerTy();
Evan Chenga8e29892007-01-19 07:51:42 +00001701 JumpTableSDNode *JT = cast<JumpTableSDNode>(Table);
1702 ARMFunctionInfo *AFI = DAG.getMachineFunction().getInfo<ARMFunctionInfo>();
Dan Gohman475871a2008-07-27 21:46:04 +00001703 SDValue UId = DAG.getConstant(AFI->createJumpTableUId(), PTy);
1704 SDValue JTI = DAG.getTargetJumpTable(JT->getIndex(), PTy);
Dale Johannesende064702009-02-06 21:50:26 +00001705 Table = DAG.getNode(ARMISD::WrapperJT, dl, MVT::i32, JTI, UId);
Dale Johannesen33c960f2009-02-04 20:06:27 +00001706 Index = DAG.getNode(ISD::MUL, dl, PTy, Index, DAG.getConstant(4, PTy));
1707 SDValue Addr = DAG.getNode(ISD::ADD, dl, PTy, Index, Table);
Evan Chenga8e29892007-01-19 07:51:42 +00001708 bool isPIC = getTargetMachine().getRelocationModel() == Reloc::PIC_;
Dale Johannesen33c960f2009-02-04 20:06:27 +00001709 Addr = DAG.getLoad(isPIC ? (MVT)MVT::i32 : PTy, dl,
Evan Chenge2446c62007-06-26 18:31:22 +00001710 Chain, Addr, NULL, 0);
Evan Chenga8e29892007-01-19 07:51:42 +00001711 Chain = Addr.getValue(1);
1712 if (isPIC)
Dale Johannesen33c960f2009-02-04 20:06:27 +00001713 Addr = DAG.getNode(ISD::ADD, dl, PTy, Addr, Table);
1714 return DAG.getNode(ARMISD::BR_JT, dl, MVT::Other, Chain, Addr, JTI, UId);
Evan Chenga8e29892007-01-19 07:51:42 +00001715}
1716
Dan Gohman475871a2008-07-27 21:46:04 +00001717static SDValue LowerFP_TO_INT(SDValue Op, SelectionDAG &DAG) {
Dale Johannesende064702009-02-06 21:50:26 +00001718 DebugLoc dl = Op.getDebugLoc();
Evan Chenga8e29892007-01-19 07:51:42 +00001719 unsigned Opc =
1720 Op.getOpcode() == ISD::FP_TO_SINT ? ARMISD::FTOSI : ARMISD::FTOUI;
Dale Johannesende064702009-02-06 21:50:26 +00001721 Op = DAG.getNode(Opc, dl, MVT::f32, Op.getOperand(0));
1722 return DAG.getNode(ISD::BIT_CONVERT, dl, MVT::i32, Op);
Evan Chenga8e29892007-01-19 07:51:42 +00001723}
1724
Dan Gohman475871a2008-07-27 21:46:04 +00001725static SDValue LowerINT_TO_FP(SDValue Op, SelectionDAG &DAG) {
Duncan Sands83ec4b62008-06-06 12:08:01 +00001726 MVT VT = Op.getValueType();
Dale Johannesende064702009-02-06 21:50:26 +00001727 DebugLoc dl = Op.getDebugLoc();
Evan Chenga8e29892007-01-19 07:51:42 +00001728 unsigned Opc =
1729 Op.getOpcode() == ISD::SINT_TO_FP ? ARMISD::SITOF : ARMISD::UITOF;
1730
Dale Johannesende064702009-02-06 21:50:26 +00001731 Op = DAG.getNode(ISD::BIT_CONVERT, dl, MVT::f32, Op.getOperand(0));
1732 return DAG.getNode(Opc, dl, VT, Op);
Evan Chenga8e29892007-01-19 07:51:42 +00001733}
1734
Dan Gohman475871a2008-07-27 21:46:04 +00001735static SDValue LowerFCOPYSIGN(SDValue Op, SelectionDAG &DAG) {
Evan Chenga8e29892007-01-19 07:51:42 +00001736 // Implement fcopysign with a fabs and a conditional fneg.
Dan Gohman475871a2008-07-27 21:46:04 +00001737 SDValue Tmp0 = Op.getOperand(0);
1738 SDValue Tmp1 = Op.getOperand(1);
Dale Johannesende064702009-02-06 21:50:26 +00001739 DebugLoc dl = Op.getDebugLoc();
Duncan Sands83ec4b62008-06-06 12:08:01 +00001740 MVT VT = Op.getValueType();
1741 MVT SrcVT = Tmp1.getValueType();
Dale Johannesende064702009-02-06 21:50:26 +00001742 SDValue AbsVal = DAG.getNode(ISD::FABS, dl, VT, Tmp0);
1743 SDValue Cmp = getVFPCmp(Tmp1, DAG.getConstantFP(0.0, SrcVT), DAG, dl);
Dan Gohman475871a2008-07-27 21:46:04 +00001744 SDValue ARMCC = DAG.getConstant(ARMCC::LT, MVT::i32);
1745 SDValue CCR = DAG.getRegister(ARM::CPSR, MVT::i32);
Dale Johannesende064702009-02-06 21:50:26 +00001746 return DAG.getNode(ARMISD::CNEG, dl, VT, AbsVal, AbsVal, ARMCC, CCR, Cmp);
Evan Chenga8e29892007-01-19 07:51:42 +00001747}
1748
Jim Grosbach0e0da732009-05-12 23:59:14 +00001749SDValue ARMTargetLowering::LowerFRAMEADDR(SDValue Op, SelectionDAG &DAG) {
1750 MachineFrameInfo *MFI = DAG.getMachineFunction().getFrameInfo();
1751 MFI->setFrameAddressIsTaken(true);
1752 MVT VT = Op.getValueType();
1753 DebugLoc dl = Op.getDebugLoc(); // FIXME probably not meaningful
1754 unsigned Depth = cast<ConstantSDNode>(Op.getOperand(0))->getZExtValue();
Evan Chengcd828612009-06-18 23:14:30 +00001755 unsigned FrameReg = (Subtarget->isThumb() || Subtarget->isTargetDarwin())
Jim Grosbach0e0da732009-05-12 23:59:14 +00001756 ? ARM::R7 : ARM::R11;
1757 SDValue FrameAddr = DAG.getCopyFromReg(DAG.getEntryNode(), dl, FrameReg, VT);
1758 while (Depth--)
1759 FrameAddr = DAG.getLoad(VT, dl, DAG.getEntryNode(), FrameAddr, NULL, 0);
1760 return FrameAddr;
1761}
1762
Dan Gohman475871a2008-07-27 21:46:04 +00001763SDValue
Dale Johannesen0f502f62009-02-03 22:26:09 +00001764ARMTargetLowering::EmitTargetCodeForMemcpy(SelectionDAG &DAG, DebugLoc dl,
Dan Gohman475871a2008-07-27 21:46:04 +00001765 SDValue Chain,
1766 SDValue Dst, SDValue Src,
1767 SDValue Size, unsigned Align,
Dan Gohman707e0182008-04-12 04:36:06 +00001768 bool AlwaysInline,
Dan Gohman1f13c682008-04-28 17:15:20 +00001769 const Value *DstSV, uint64_t DstSVOff,
1770 const Value *SrcSV, uint64_t SrcSVOff){
Evan Cheng4102eb52007-10-22 22:11:27 +00001771 // Do repeated 4-byte loads and stores. To be improved.
Dan Gohman707e0182008-04-12 04:36:06 +00001772 // This requires 4-byte alignment.
1773 if ((Align & 3) != 0)
Dan Gohman475871a2008-07-27 21:46:04 +00001774 return SDValue();
Dan Gohman707e0182008-04-12 04:36:06 +00001775 // This requires the copy size to be a constant, preferrably
1776 // within a subtarget-specific limit.
1777 ConstantSDNode *ConstantSize = dyn_cast<ConstantSDNode>(Size);
1778 if (!ConstantSize)
Dan Gohman475871a2008-07-27 21:46:04 +00001779 return SDValue();
Dan Gohmanf5aeb1a2008-09-12 16:56:44 +00001780 uint64_t SizeVal = ConstantSize->getZExtValue();
Dan Gohman707e0182008-04-12 04:36:06 +00001781 if (!AlwaysInline && SizeVal > getSubtarget()->getMaxInlineSizeThreshold())
Dan Gohman475871a2008-07-27 21:46:04 +00001782 return SDValue();
Dan Gohman707e0182008-04-12 04:36:06 +00001783
1784 unsigned BytesLeft = SizeVal & 3;
1785 unsigned NumMemOps = SizeVal >> 2;
Dale Johannesen8dd86c12007-05-17 21:31:21 +00001786 unsigned EmittedNumMemOps = 0;
Duncan Sands83ec4b62008-06-06 12:08:01 +00001787 MVT VT = MVT::i32;
Dale Johannesen8dd86c12007-05-17 21:31:21 +00001788 unsigned VTSize = 4;
Evan Cheng4102eb52007-10-22 22:11:27 +00001789 unsigned i = 0;
Evan Chenge5e7ce42007-05-18 01:19:57 +00001790 const unsigned MAX_LOADS_IN_LDM = 6;
Dan Gohman475871a2008-07-27 21:46:04 +00001791 SDValue TFOps[MAX_LOADS_IN_LDM];
1792 SDValue Loads[MAX_LOADS_IN_LDM];
Dan Gohman1f13c682008-04-28 17:15:20 +00001793 uint64_t SrcOff = 0, DstOff = 0;
Dale Johannesen8dd86c12007-05-17 21:31:21 +00001794
Evan Cheng4102eb52007-10-22 22:11:27 +00001795 // Emit up to MAX_LOADS_IN_LDM loads, then a TokenFactor barrier, then the
1796 // same number of stores. The loads and stores will get combined into
Dale Johannesen8dd86c12007-05-17 21:31:21 +00001797 // ldm/stm later on.
Evan Cheng4102eb52007-10-22 22:11:27 +00001798 while (EmittedNumMemOps < NumMemOps) {
1799 for (i = 0;
1800 i < MAX_LOADS_IN_LDM && EmittedNumMemOps + i < NumMemOps; ++i) {
Dale Johannesen0f502f62009-02-03 22:26:09 +00001801 Loads[i] = DAG.getLoad(VT, dl, Chain,
1802 DAG.getNode(ISD::ADD, dl, MVT::i32, Src,
Evan Cheng4102eb52007-10-22 22:11:27 +00001803 DAG.getConstant(SrcOff, MVT::i32)),
Dan Gohman1f13c682008-04-28 17:15:20 +00001804 SrcSV, SrcSVOff + SrcOff);
Evan Cheng4102eb52007-10-22 22:11:27 +00001805 TFOps[i] = Loads[i].getValue(1);
Dale Johannesen8dd86c12007-05-17 21:31:21 +00001806 SrcOff += VTSize;
1807 }
Dale Johannesen0f502f62009-02-03 22:26:09 +00001808 Chain = DAG.getNode(ISD::TokenFactor, dl, MVT::Other, &TFOps[0], i);
Dale Johannesen8dd86c12007-05-17 21:31:21 +00001809
Evan Cheng4102eb52007-10-22 22:11:27 +00001810 for (i = 0;
1811 i < MAX_LOADS_IN_LDM && EmittedNumMemOps + i < NumMemOps; ++i) {
Dale Johannesen0f502f62009-02-03 22:26:09 +00001812 TFOps[i] = DAG.getStore(Chain, dl, Loads[i],
Bob Wilson2dc4f542009-03-20 22:42:55 +00001813 DAG.getNode(ISD::ADD, dl, MVT::i32, Dst,
Evan Cheng4102eb52007-10-22 22:11:27 +00001814 DAG.getConstant(DstOff, MVT::i32)),
Dan Gohman1f13c682008-04-28 17:15:20 +00001815 DstSV, DstSVOff + DstOff);
Dale Johannesen8dd86c12007-05-17 21:31:21 +00001816 DstOff += VTSize;
1817 }
Dale Johannesen0f502f62009-02-03 22:26:09 +00001818 Chain = DAG.getNode(ISD::TokenFactor, dl, MVT::Other, &TFOps[0], i);
Evan Cheng4102eb52007-10-22 22:11:27 +00001819
Dale Johannesen8dd86c12007-05-17 21:31:21 +00001820 EmittedNumMemOps += i;
1821 }
1822
Bob Wilson2dc4f542009-03-20 22:42:55 +00001823 if (BytesLeft == 0)
Evan Cheng4102eb52007-10-22 22:11:27 +00001824 return Chain;
1825
1826 // Issue loads / stores for the trailing (1 - 3) bytes.
1827 unsigned BytesLeftSave = BytesLeft;
1828 i = 0;
1829 while (BytesLeft) {
1830 if (BytesLeft >= 2) {
1831 VT = MVT::i16;
1832 VTSize = 2;
1833 } else {
1834 VT = MVT::i8;
1835 VTSize = 1;
1836 }
1837
Dale Johannesen0f502f62009-02-03 22:26:09 +00001838 Loads[i] = DAG.getLoad(VT, dl, Chain,
1839 DAG.getNode(ISD::ADD, dl, MVT::i32, Src,
Evan Cheng4102eb52007-10-22 22:11:27 +00001840 DAG.getConstant(SrcOff, MVT::i32)),
Dan Gohman1f13c682008-04-28 17:15:20 +00001841 SrcSV, SrcSVOff + SrcOff);
Evan Cheng4102eb52007-10-22 22:11:27 +00001842 TFOps[i] = Loads[i].getValue(1);
1843 ++i;
1844 SrcOff += VTSize;
1845 BytesLeft -= VTSize;
1846 }
Dale Johannesen0f502f62009-02-03 22:26:09 +00001847 Chain = DAG.getNode(ISD::TokenFactor, dl, MVT::Other, &TFOps[0], i);
Evan Cheng4102eb52007-10-22 22:11:27 +00001848
1849 i = 0;
1850 BytesLeft = BytesLeftSave;
1851 while (BytesLeft) {
1852 if (BytesLeft >= 2) {
1853 VT = MVT::i16;
1854 VTSize = 2;
1855 } else {
1856 VT = MVT::i8;
1857 VTSize = 1;
1858 }
1859
Dale Johannesen0f502f62009-02-03 22:26:09 +00001860 TFOps[i] = DAG.getStore(Chain, dl, Loads[i],
Bob Wilson2dc4f542009-03-20 22:42:55 +00001861 DAG.getNode(ISD::ADD, dl, MVT::i32, Dst,
Evan Cheng4102eb52007-10-22 22:11:27 +00001862 DAG.getConstant(DstOff, MVT::i32)),
Dan Gohman1f13c682008-04-28 17:15:20 +00001863 DstSV, DstSVOff + DstOff);
Evan Cheng4102eb52007-10-22 22:11:27 +00001864 ++i;
1865 DstOff += VTSize;
1866 BytesLeft -= VTSize;
1867 }
Dale Johannesen0f502f62009-02-03 22:26:09 +00001868 return DAG.getNode(ISD::TokenFactor, dl, MVT::Other, &TFOps[0], i);
Dale Johannesen8dd86c12007-05-17 21:31:21 +00001869}
1870
Duncan Sands1607f052008-12-01 11:39:25 +00001871static SDValue ExpandBIT_CONVERT(SDNode *N, SelectionDAG &DAG) {
Dan Gohman475871a2008-07-27 21:46:04 +00001872 SDValue Op = N->getOperand(0);
Dale Johannesende064702009-02-06 21:50:26 +00001873 DebugLoc dl = N->getDebugLoc();
Evan Chengc7c77292008-11-04 19:57:48 +00001874 if (N->getValueType(0) == MVT::f64) {
1875 // Turn i64->f64 into FMDRR.
Dale Johannesende064702009-02-06 21:50:26 +00001876 SDValue Lo = DAG.getNode(ISD::EXTRACT_ELEMENT, dl, MVT::i32, Op,
Evan Chengc7c77292008-11-04 19:57:48 +00001877 DAG.getConstant(0, MVT::i32));
Dale Johannesende064702009-02-06 21:50:26 +00001878 SDValue Hi = DAG.getNode(ISD::EXTRACT_ELEMENT, dl, MVT::i32, Op,
Evan Chengc7c77292008-11-04 19:57:48 +00001879 DAG.getConstant(1, MVT::i32));
Dale Johannesende064702009-02-06 21:50:26 +00001880 return DAG.getNode(ARMISD::FMDRR, dl, MVT::f64, Lo, Hi);
Evan Chengc7c77292008-11-04 19:57:48 +00001881 }
Bob Wilson2dc4f542009-03-20 22:42:55 +00001882
Evan Chengc7c77292008-11-04 19:57:48 +00001883 // Turn f64->i64 into FMRRD.
Bob Wilson2dc4f542009-03-20 22:42:55 +00001884 SDValue Cvt = DAG.getNode(ARMISD::FMRRD, dl,
Dale Johannesende064702009-02-06 21:50:26 +00001885 DAG.getVTList(MVT::i32, MVT::i32), &Op, 1);
Bob Wilson2dc4f542009-03-20 22:42:55 +00001886
Chris Lattner27a6c732007-11-24 07:07:01 +00001887 // Merge the pieces into a single i64 value.
Dale Johannesende064702009-02-06 21:50:26 +00001888 return DAG.getNode(ISD::BUILD_PAIR, dl, MVT::i64, Cvt, Cvt.getValue(1));
Chris Lattner27a6c732007-11-24 07:07:01 +00001889}
1890
Bob Wilson5bafff32009-06-22 23:27:02 +00001891/// getZeroVector - Returns a vector of specified type with all zero elements.
1892///
1893static SDValue getZeroVector(MVT VT, SelectionDAG &DAG, DebugLoc dl) {
1894 assert(VT.isVector() && "Expected a vector type");
1895
1896 // Zero vectors are used to represent vector negation and in those cases
1897 // will be implemented with the NEON VNEG instruction. However, VNEG does
1898 // not support i64 elements, so sometimes the zero vectors will need to be
1899 // explicitly constructed. For those cases, and potentially other uses in
1900 // the future, always build zero vectors as <4 x i32> or <2 x i32> bitcasted
1901 // to their dest type. This ensures they get CSE'd.
1902 SDValue Vec;
1903 SDValue Cst = DAG.getTargetConstant(0, MVT::i32);
1904 if (VT.getSizeInBits() == 64)
1905 Vec = DAG.getNode(ISD::BUILD_VECTOR, dl, MVT::v2i32, Cst, Cst);
1906 else
1907 Vec = DAG.getNode(ISD::BUILD_VECTOR, dl, MVT::v4i32, Cst, Cst, Cst, Cst);
1908
1909 return DAG.getNode(ISD::BIT_CONVERT, dl, VT, Vec);
1910}
1911
1912/// getOnesVector - Returns a vector of specified type with all bits set.
1913///
1914static SDValue getOnesVector(MVT VT, SelectionDAG &DAG, DebugLoc dl) {
1915 assert(VT.isVector() && "Expected a vector type");
1916
1917 // Always build ones vectors as <4 x i32> or <2 x i32> bitcasted to their dest
1918 // type. This ensures they get CSE'd.
1919 SDValue Vec;
1920 SDValue Cst = DAG.getTargetConstant(~0U, MVT::i32);
1921 if (VT.getSizeInBits() == 64)
1922 Vec = DAG.getNode(ISD::BUILD_VECTOR, dl, MVT::v2i32, Cst, Cst);
1923 else
1924 Vec = DAG.getNode(ISD::BUILD_VECTOR, dl, MVT::v4i32, Cst, Cst, Cst, Cst);
1925
1926 return DAG.getNode(ISD::BIT_CONVERT, dl, VT, Vec);
1927}
1928
1929static SDValue LowerShift(SDNode *N, SelectionDAG &DAG,
1930 const ARMSubtarget *ST) {
1931 MVT VT = N->getValueType(0);
1932 DebugLoc dl = N->getDebugLoc();
1933
1934 // Lower vector shifts on NEON to use VSHL.
1935 if (VT.isVector()) {
1936 assert(ST->hasNEON() && "unexpected vector shift");
1937
1938 // Left shifts translate directly to the vshiftu intrinsic.
1939 if (N->getOpcode() == ISD::SHL)
1940 return DAG.getNode(ISD::INTRINSIC_WO_CHAIN, dl, VT,
1941 DAG.getConstant(Intrinsic::arm_neon_vshiftu, MVT::i32),
1942 N->getOperand(0), N->getOperand(1));
1943
1944 assert((N->getOpcode() == ISD::SRA ||
1945 N->getOpcode() == ISD::SRL) && "unexpected vector shift opcode");
1946
1947 // NEON uses the same intrinsics for both left and right shifts. For
1948 // right shifts, the shift amounts are negative, so negate the vector of
1949 // shift amounts.
1950 MVT ShiftVT = N->getOperand(1).getValueType();
1951 SDValue NegatedCount = DAG.getNode(ISD::SUB, dl, ShiftVT,
1952 getZeroVector(ShiftVT, DAG, dl),
1953 N->getOperand(1));
1954 Intrinsic::ID vshiftInt = (N->getOpcode() == ISD::SRA ?
1955 Intrinsic::arm_neon_vshifts :
1956 Intrinsic::arm_neon_vshiftu);
1957 return DAG.getNode(ISD::INTRINSIC_WO_CHAIN, dl, VT,
1958 DAG.getConstant(vshiftInt, MVT::i32),
1959 N->getOperand(0), NegatedCount);
1960 }
1961
1962 assert(VT == MVT::i64 &&
Chris Lattner27a6c732007-11-24 07:07:01 +00001963 (N->getOpcode() == ISD::SRL || N->getOpcode() == ISD::SRA) &&
1964 "Unknown shift to lower!");
Duncan Sands1607f052008-12-01 11:39:25 +00001965
Chris Lattner27a6c732007-11-24 07:07:01 +00001966 // We only lower SRA, SRL of 1 here, all others use generic lowering.
1967 if (!isa<ConstantSDNode>(N->getOperand(1)) ||
Dan Gohmanf5aeb1a2008-09-12 16:56:44 +00001968 cast<ConstantSDNode>(N->getOperand(1))->getZExtValue() != 1)
Duncan Sands1607f052008-12-01 11:39:25 +00001969 return SDValue();
Bob Wilson2dc4f542009-03-20 22:42:55 +00001970
Chris Lattner27a6c732007-11-24 07:07:01 +00001971 // If we are in thumb mode, we don't have RRX.
Duncan Sands1607f052008-12-01 11:39:25 +00001972 if (ST->isThumb()) return SDValue();
Bob Wilson2dc4f542009-03-20 22:42:55 +00001973
Chris Lattner27a6c732007-11-24 07:07:01 +00001974 // Okay, we have a 64-bit SRA or SRL of 1. Lower this to an RRX expr.
Dale Johannesende064702009-02-06 21:50:26 +00001975 SDValue Lo = DAG.getNode(ISD::EXTRACT_ELEMENT, dl, MVT::i32, N->getOperand(0),
Chris Lattner27a6c732007-11-24 07:07:01 +00001976 DAG.getConstant(0, MVT::i32));
Dale Johannesende064702009-02-06 21:50:26 +00001977 SDValue Hi = DAG.getNode(ISD::EXTRACT_ELEMENT, dl, MVT::i32, N->getOperand(0),
Chris Lattner27a6c732007-11-24 07:07:01 +00001978 DAG.getConstant(1, MVT::i32));
Bob Wilson2dc4f542009-03-20 22:42:55 +00001979
Chris Lattner27a6c732007-11-24 07:07:01 +00001980 // First, build a SRA_FLAG/SRL_FLAG op, which shifts the top part by one and
1981 // captures the result into a carry flag.
1982 unsigned Opc = N->getOpcode() == ISD::SRL ? ARMISD::SRL_FLAG:ARMISD::SRA_FLAG;
Dale Johannesende064702009-02-06 21:50:26 +00001983 Hi = DAG.getNode(Opc, dl, DAG.getVTList(MVT::i32, MVT::Flag), &Hi, 1);
Bob Wilson2dc4f542009-03-20 22:42:55 +00001984
Chris Lattner27a6c732007-11-24 07:07:01 +00001985 // The low part is an ARMISD::RRX operand, which shifts the carry in.
Dale Johannesende064702009-02-06 21:50:26 +00001986 Lo = DAG.getNode(ARMISD::RRX, dl, MVT::i32, Lo, Hi.getValue(1));
Bob Wilson2dc4f542009-03-20 22:42:55 +00001987
Chris Lattner27a6c732007-11-24 07:07:01 +00001988 // Merge the pieces into a single i64 value.
Dale Johannesende064702009-02-06 21:50:26 +00001989 return DAG.getNode(ISD::BUILD_PAIR, dl, MVT::i64, Lo, Hi);
Chris Lattner27a6c732007-11-24 07:07:01 +00001990}
1991
Bob Wilson5bafff32009-06-22 23:27:02 +00001992static SDValue LowerVSETCC(SDValue Op, SelectionDAG &DAG) {
1993 SDValue TmpOp0, TmpOp1;
1994 bool Invert = false;
1995 bool Swap = false;
1996 unsigned Opc = 0;
1997
1998 SDValue Op0 = Op.getOperand(0);
1999 SDValue Op1 = Op.getOperand(1);
2000 SDValue CC = Op.getOperand(2);
2001 MVT VT = Op.getValueType();
2002 ISD::CondCode SetCCOpcode = cast<CondCodeSDNode>(CC)->get();
2003 DebugLoc dl = Op.getDebugLoc();
2004
2005 if (Op.getOperand(1).getValueType().isFloatingPoint()) {
2006 switch (SetCCOpcode) {
2007 default: assert(0 && "Illegal FP comparison"); break;
2008 case ISD::SETUNE:
2009 case ISD::SETNE: Invert = true; // Fallthrough
2010 case ISD::SETOEQ:
2011 case ISD::SETEQ: Opc = ARMISD::VCEQ; break;
2012 case ISD::SETOLT:
2013 case ISD::SETLT: Swap = true; // Fallthrough
2014 case ISD::SETOGT:
2015 case ISD::SETGT: Opc = ARMISD::VCGT; break;
2016 case ISD::SETOLE:
2017 case ISD::SETLE: Swap = true; // Fallthrough
2018 case ISD::SETOGE:
2019 case ISD::SETGE: Opc = ARMISD::VCGE; break;
2020 case ISD::SETUGE: Swap = true; // Fallthrough
2021 case ISD::SETULE: Invert = true; Opc = ARMISD::VCGT; break;
2022 case ISD::SETUGT: Swap = true; // Fallthrough
2023 case ISD::SETULT: Invert = true; Opc = ARMISD::VCGE; break;
2024 case ISD::SETUEQ: Invert = true; // Fallthrough
2025 case ISD::SETONE:
2026 // Expand this to (OLT | OGT).
2027 TmpOp0 = Op0;
2028 TmpOp1 = Op1;
2029 Opc = ISD::OR;
2030 Op0 = DAG.getNode(ARMISD::VCGT, dl, VT, TmpOp1, TmpOp0);
2031 Op1 = DAG.getNode(ARMISD::VCGT, dl, VT, TmpOp0, TmpOp1);
2032 break;
2033 case ISD::SETUO: Invert = true; // Fallthrough
2034 case ISD::SETO:
2035 // Expand this to (OLT | OGE).
2036 TmpOp0 = Op0;
2037 TmpOp1 = Op1;
2038 Opc = ISD::OR;
2039 Op0 = DAG.getNode(ARMISD::VCGT, dl, VT, TmpOp1, TmpOp0);
2040 Op1 = DAG.getNode(ARMISD::VCGE, dl, VT, TmpOp0, TmpOp1);
2041 break;
2042 }
2043 } else {
2044 // Integer comparisons.
2045 switch (SetCCOpcode) {
2046 default: assert(0 && "Illegal integer comparison"); break;
2047 case ISD::SETNE: Invert = true;
2048 case ISD::SETEQ: Opc = ARMISD::VCEQ; break;
2049 case ISD::SETLT: Swap = true;
2050 case ISD::SETGT: Opc = ARMISD::VCGT; break;
2051 case ISD::SETLE: Swap = true;
2052 case ISD::SETGE: Opc = ARMISD::VCGE; break;
2053 case ISD::SETULT: Swap = true;
2054 case ISD::SETUGT: Opc = ARMISD::VCGTU; break;
2055 case ISD::SETULE: Swap = true;
2056 case ISD::SETUGE: Opc = ARMISD::VCGEU; break;
2057 }
2058
2059 // Detect VTST (Vector Test Bits) = vicmp ne (and (op0, op1), zero).
2060 if (Opc == ARMISD::VCEQ) {
2061
2062 SDValue AndOp;
2063 if (ISD::isBuildVectorAllZeros(Op1.getNode()))
2064 AndOp = Op0;
2065 else if (ISD::isBuildVectorAllZeros(Op0.getNode()))
2066 AndOp = Op1;
2067
2068 // Ignore bitconvert.
2069 if (AndOp.getNode() && AndOp.getOpcode() == ISD::BIT_CONVERT)
2070 AndOp = AndOp.getOperand(0);
2071
2072 if (AndOp.getNode() && AndOp.getOpcode() == ISD::AND) {
2073 Opc = ARMISD::VTST;
2074 Op0 = DAG.getNode(ISD::BIT_CONVERT, dl, VT, AndOp.getOperand(0));
2075 Op1 = DAG.getNode(ISD::BIT_CONVERT, dl, VT, AndOp.getOperand(1));
2076 Invert = !Invert;
2077 }
2078 }
2079 }
2080
2081 if (Swap)
2082 std::swap(Op0, Op1);
2083
2084 SDValue Result = DAG.getNode(Opc, dl, VT, Op0, Op1);
2085
2086 if (Invert)
2087 Result = DAG.getNOT(dl, Result, VT);
2088
2089 return Result;
2090}
2091
2092/// isVMOVSplat - Check if the specified splat value corresponds to an immediate
2093/// VMOV instruction, and if so, return the constant being splatted.
2094static SDValue isVMOVSplat(uint64_t SplatBits, uint64_t SplatUndef,
2095 unsigned SplatBitSize, SelectionDAG &DAG) {
2096 switch (SplatBitSize) {
2097 case 8:
2098 // Any 1-byte value is OK.
2099 assert((SplatBits & ~0xff) == 0 && "one byte splat value is too big");
2100 return DAG.getTargetConstant(SplatBits, MVT::i8);
2101
2102 case 16:
2103 // NEON's 16-bit VMOV supports splat values where only one byte is nonzero.
2104 if ((SplatBits & ~0xff) == 0 ||
2105 (SplatBits & ~0xff00) == 0)
2106 return DAG.getTargetConstant(SplatBits, MVT::i16);
2107 break;
2108
2109 case 32:
2110 // NEON's 32-bit VMOV supports splat values where:
2111 // * only one byte is nonzero, or
2112 // * the least significant byte is 0xff and the second byte is nonzero, or
2113 // * the least significant 2 bytes are 0xff and the third is nonzero.
2114 if ((SplatBits & ~0xff) == 0 ||
2115 (SplatBits & ~0xff00) == 0 ||
2116 (SplatBits & ~0xff0000) == 0 ||
2117 (SplatBits & ~0xff000000) == 0)
2118 return DAG.getTargetConstant(SplatBits, MVT::i32);
2119
2120 if ((SplatBits & ~0xffff) == 0 &&
2121 ((SplatBits | SplatUndef) & 0xff) == 0xff)
2122 return DAG.getTargetConstant(SplatBits | 0xff, MVT::i32);
2123
2124 if ((SplatBits & ~0xffffff) == 0 &&
2125 ((SplatBits | SplatUndef) & 0xffff) == 0xffff)
2126 return DAG.getTargetConstant(SplatBits | 0xffff, MVT::i32);
2127
2128 // Note: there are a few 32-bit splat values (specifically: 00ffff00,
2129 // ff000000, ff0000ff, and ffff00ff) that are valid for VMOV.I64 but not
2130 // VMOV.I32. A (very) minor optimization would be to replicate the value
2131 // and fall through here to test for a valid 64-bit splat. But, then the
2132 // caller would also need to check and handle the change in size.
2133 break;
2134
2135 case 64: {
2136 // NEON has a 64-bit VMOV splat where each byte is either 0 or 0xff.
2137 uint64_t BitMask = 0xff;
2138 uint64_t Val = 0;
2139 for (int ByteNum = 0; ByteNum < 8; ++ByteNum) {
2140 if (((SplatBits | SplatUndef) & BitMask) == BitMask)
2141 Val |= BitMask;
2142 else if ((SplatBits & BitMask) != 0)
2143 return SDValue();
2144 BitMask <<= 8;
2145 }
2146 return DAG.getTargetConstant(Val, MVT::i64);
2147 }
2148
2149 default:
2150 assert(0 && "unexpected size for isVMOVSplat");
2151 break;
2152 }
2153
2154 return SDValue();
2155}
2156
2157/// getVMOVImm - If this is a build_vector of constants which can be
2158/// formed by using a VMOV instruction of the specified element size,
2159/// return the constant being splatted. The ByteSize field indicates the
2160/// number of bytes of each element [1248].
2161SDValue ARM::getVMOVImm(SDNode *N, unsigned ByteSize, SelectionDAG &DAG) {
2162 BuildVectorSDNode *BVN = dyn_cast<BuildVectorSDNode>(N);
2163 APInt SplatBits, SplatUndef;
2164 unsigned SplatBitSize;
2165 bool HasAnyUndefs;
2166 if (! BVN || ! BVN->isConstantSplat(SplatBits, SplatUndef, SplatBitSize,
2167 HasAnyUndefs, ByteSize * 8))
2168 return SDValue();
2169
2170 if (SplatBitSize > ByteSize * 8)
2171 return SDValue();
2172
2173 return isVMOVSplat(SplatBits.getZExtValue(), SplatUndef.getZExtValue(),
2174 SplatBitSize, DAG);
2175}
2176
2177static SDValue BuildSplat(SDValue Val, MVT VT, SelectionDAG &DAG, DebugLoc dl) {
2178 // Canonicalize all-zeros and all-ones vectors.
2179 ConstantSDNode *ConstVal = dyn_cast<ConstantSDNode>(Val.getNode());
2180 if (ConstVal->isNullValue())
2181 return getZeroVector(VT, DAG, dl);
2182 if (ConstVal->isAllOnesValue())
2183 return getOnesVector(VT, DAG, dl);
2184
2185 MVT CanonicalVT;
2186 if (VT.is64BitVector()) {
2187 switch (Val.getValueType().getSizeInBits()) {
2188 case 8: CanonicalVT = MVT::v8i8; break;
2189 case 16: CanonicalVT = MVT::v4i16; break;
2190 case 32: CanonicalVT = MVT::v2i32; break;
2191 case 64: CanonicalVT = MVT::v1i64; break;
2192 default: assert(0 && "unexpected splat element type"); break;
2193 }
2194 } else {
2195 assert(VT.is128BitVector() && "unknown splat vector size");
2196 switch (Val.getValueType().getSizeInBits()) {
2197 case 8: CanonicalVT = MVT::v16i8; break;
2198 case 16: CanonicalVT = MVT::v8i16; break;
2199 case 32: CanonicalVT = MVT::v4i32; break;
2200 case 64: CanonicalVT = MVT::v2i64; break;
2201 default: assert(0 && "unexpected splat element type"); break;
2202 }
2203 }
2204
2205 // Build a canonical splat for this value.
2206 SmallVector<SDValue, 8> Ops;
2207 Ops.assign(CanonicalVT.getVectorNumElements(), Val);
2208 SDValue Res = DAG.getNode(ISD::BUILD_VECTOR, dl, CanonicalVT, &Ops[0],
2209 Ops.size());
2210 return DAG.getNode(ISD::BIT_CONVERT, dl, VT, Res);
2211}
2212
2213// If this is a case we can't handle, return null and let the default
2214// expansion code take care of it.
2215static SDValue LowerBUILD_VECTOR(SDValue Op, SelectionDAG &DAG) {
2216 BuildVectorSDNode *BVN = dyn_cast<BuildVectorSDNode>(Op.getNode());
2217 assert(BVN != 0 && "Expected a BuildVectorSDNode in LowerBUILD_VECTOR");
2218 DebugLoc dl = Op.getDebugLoc();
2219
2220 APInt SplatBits, SplatUndef;
2221 unsigned SplatBitSize;
2222 bool HasAnyUndefs;
2223 if (BVN->isConstantSplat(SplatBits, SplatUndef, SplatBitSize, HasAnyUndefs)) {
2224 SDValue Val = isVMOVSplat(SplatBits.getZExtValue(),
2225 SplatUndef.getZExtValue(), SplatBitSize, DAG);
2226 if (Val.getNode())
2227 return BuildSplat(Val, Op.getValueType(), DAG, dl);
2228 }
2229
2230 return SDValue();
2231}
2232
2233static SDValue LowerVECTOR_SHUFFLE(SDValue Op, SelectionDAG &DAG) {
2234 return Op;
2235}
2236
2237static SDValue LowerSCALAR_TO_VECTOR(SDValue Op, SelectionDAG &DAG) {
2238 return Op;
2239}
2240
2241static SDValue LowerEXTRACT_VECTOR_ELT(SDValue Op, SelectionDAG &DAG) {
2242 MVT VT = Op.getValueType();
2243 DebugLoc dl = Op.getDebugLoc();
2244 assert((VT == MVT::i8 || VT == MVT::i16) &&
2245 "unexpected type for custom-lowering vector extract");
2246 SDValue Vec = Op.getOperand(0);
2247 SDValue Lane = Op.getOperand(1);
2248 Op = DAG.getNode(ARMISD::VGETLANEu, dl, MVT::i32, Vec, Lane);
2249 Op = DAG.getNode(ISD::AssertZext, dl, MVT::i32, Op, DAG.getValueType(VT));
2250 return DAG.getNode(ISD::TRUNCATE, dl, VT, Op);
2251}
2252
2253static SDValue LowerCONCAT_VECTORS(SDValue Op) {
2254 if (Op.getValueType().is128BitVector() && Op.getNumOperands() == 2)
2255 return Op;
2256 return SDValue();
2257}
2258
Dan Gohman475871a2008-07-27 21:46:04 +00002259SDValue ARMTargetLowering::LowerOperation(SDValue Op, SelectionDAG &DAG) {
Evan Chenga8e29892007-01-19 07:51:42 +00002260 switch (Op.getOpcode()) {
2261 default: assert(0 && "Don't know how to custom lower this!"); abort();
2262 case ISD::ConstantPool: return LowerConstantPool(Op, DAG);
Lauro Ramos Venancio0ae4a332007-04-22 00:04:12 +00002263 case ISD::GlobalAddress:
2264 return Subtarget->isTargetDarwin() ? LowerGlobalAddressDarwin(Op, DAG) :
2265 LowerGlobalAddressELF(Op, DAG);
Lauro Ramos Venancio64f4fa52007-04-27 13:54:47 +00002266 case ISD::GlobalTLSAddress: return LowerGlobalTLSAddress(Op, DAG);
Evan Chenga8e29892007-01-19 07:51:42 +00002267 case ISD::CALL: return LowerCALL(Op, DAG);
2268 case ISD::RET: return LowerRET(Op, DAG);
2269 case ISD::SELECT_CC: return LowerSELECT_CC(Op, DAG, Subtarget);
2270 case ISD::BR_CC: return LowerBR_CC(Op, DAG, Subtarget);
2271 case ISD::BR_JT: return LowerBR_JT(Op, DAG);
2272 case ISD::VASTART: return LowerVASTART(Op, DAG, VarArgsFrameIndex);
2273 case ISD::SINT_TO_FP:
2274 case ISD::UINT_TO_FP: return LowerINT_TO_FP(Op, DAG);
2275 case ISD::FP_TO_SINT:
2276 case ISD::FP_TO_UINT: return LowerFP_TO_INT(Op, DAG);
2277 case ISD::FCOPYSIGN: return LowerFCOPYSIGN(Op, DAG);
Chris Lattner27a6c732007-11-24 07:07:01 +00002278 case ISD::FORMAL_ARGUMENTS: return LowerFORMAL_ARGUMENTS(Op, DAG);
Nate Begemanbcc5f362007-01-29 22:58:52 +00002279 case ISD::RETURNADDR: break;
Jim Grosbach0e0da732009-05-12 23:59:14 +00002280 case ISD::FRAMEADDR: return LowerFRAMEADDR(Op, DAG);
Lauro Ramos Venancio0ae4a332007-04-22 00:04:12 +00002281 case ISD::GLOBAL_OFFSET_TABLE: return LowerGLOBAL_OFFSET_TABLE(Op, DAG);
Lauro Ramos Venancioe0cb36b2007-11-08 17:20:05 +00002282 case ISD::INTRINSIC_WO_CHAIN: return LowerINTRINSIC_WO_CHAIN(Op, DAG);
Duncan Sands1607f052008-12-01 11:39:25 +00002283 case ISD::BIT_CONVERT: return ExpandBIT_CONVERT(Op.getNode(), DAG);
Bob Wilson5bafff32009-06-22 23:27:02 +00002284 case ISD::SHL:
Chris Lattner27a6c732007-11-24 07:07:01 +00002285 case ISD::SRL:
Bob Wilson5bafff32009-06-22 23:27:02 +00002286 case ISD::SRA: return LowerShift(Op.getNode(), DAG, Subtarget);
2287 case ISD::VSETCC: return LowerVSETCC(Op, DAG);
2288 case ISD::BUILD_VECTOR: return LowerBUILD_VECTOR(Op, DAG);
2289 case ISD::VECTOR_SHUFFLE: return LowerVECTOR_SHUFFLE(Op, DAG);
2290 case ISD::SCALAR_TO_VECTOR: return LowerSCALAR_TO_VECTOR(Op, DAG);
2291 case ISD::EXTRACT_VECTOR_ELT: return LowerEXTRACT_VECTOR_ELT(Op, DAG);
2292 case ISD::CONCAT_VECTORS: return LowerCONCAT_VECTORS(Op);
Evan Chenga8e29892007-01-19 07:51:42 +00002293 }
Dan Gohman475871a2008-07-27 21:46:04 +00002294 return SDValue();
Evan Chenga8e29892007-01-19 07:51:42 +00002295}
2296
Duncan Sands1607f052008-12-01 11:39:25 +00002297/// ReplaceNodeResults - Replace the results of node with an illegal result
2298/// type with new values built out of custom code.
Duncan Sands1607f052008-12-01 11:39:25 +00002299void ARMTargetLowering::ReplaceNodeResults(SDNode *N,
2300 SmallVectorImpl<SDValue>&Results,
2301 SelectionDAG &DAG) {
Chris Lattner27a6c732007-11-24 07:07:01 +00002302 switch (N->getOpcode()) {
Duncan Sands1607f052008-12-01 11:39:25 +00002303 default:
2304 assert(0 && "Don't know how to custom expand this!");
2305 return;
2306 case ISD::BIT_CONVERT:
2307 Results.push_back(ExpandBIT_CONVERT(N, DAG));
2308 return;
Chris Lattner27a6c732007-11-24 07:07:01 +00002309 case ISD::SRL:
Duncan Sands1607f052008-12-01 11:39:25 +00002310 case ISD::SRA: {
Bob Wilson5bafff32009-06-22 23:27:02 +00002311 SDValue Res = LowerShift(N, DAG, Subtarget);
Duncan Sands1607f052008-12-01 11:39:25 +00002312 if (Res.getNode())
2313 Results.push_back(Res);
2314 return;
2315 }
Chris Lattner27a6c732007-11-24 07:07:01 +00002316 }
2317}
Chris Lattner27a6c732007-11-24 07:07:01 +00002318
Evan Chenga8e29892007-01-19 07:51:42 +00002319//===----------------------------------------------------------------------===//
2320// ARM Scheduler Hooks
2321//===----------------------------------------------------------------------===//
2322
2323MachineBasicBlock *
Evan Chengff9b3732008-01-30 18:18:23 +00002324ARMTargetLowering::EmitInstrWithCustomInserter(MachineInstr *MI,
Dan Gohman1fdbc1d2009-02-07 16:15:20 +00002325 MachineBasicBlock *BB) const {
Evan Chenga8e29892007-01-19 07:51:42 +00002326 const TargetInstrInfo *TII = getTargetMachine().getInstrInfo();
Dale Johannesenb6728402009-02-13 02:25:56 +00002327 DebugLoc dl = MI->getDebugLoc();
Evan Chenga8e29892007-01-19 07:51:42 +00002328 switch (MI->getOpcode()) {
2329 default: assert(false && "Unexpected instr type to insert");
2330 case ARM::tMOVCCr: {
2331 // To "insert" a SELECT_CC instruction, we actually have to insert the
2332 // diamond control-flow pattern. The incoming instruction knows the
2333 // destination vreg to set, the condition code register to branch on, the
2334 // true/false values to select between, and a branch opcode to use.
2335 const BasicBlock *LLVM_BB = BB->getBasicBlock();
Dan Gohman8e5f2c62008-07-07 23:14:23 +00002336 MachineFunction::iterator It = BB;
Evan Chenga8e29892007-01-19 07:51:42 +00002337 ++It;
2338
2339 // thisMBB:
2340 // ...
2341 // TrueVal = ...
2342 // cmpTY ccX, r1, r2
2343 // bCC copy1MBB
2344 // fallthrough --> copy0MBB
2345 MachineBasicBlock *thisMBB = BB;
Dan Gohman8e5f2c62008-07-07 23:14:23 +00002346 MachineFunction *F = BB->getParent();
2347 MachineBasicBlock *copy0MBB = F->CreateMachineBasicBlock(LLVM_BB);
2348 MachineBasicBlock *sinkMBB = F->CreateMachineBasicBlock(LLVM_BB);
Dale Johannesenb6728402009-02-13 02:25:56 +00002349 BuildMI(BB, dl, TII->get(ARM::tBcc)).addMBB(sinkMBB)
Evan Cheng0e1d3792007-07-05 07:18:20 +00002350 .addImm(MI->getOperand(3).getImm()).addReg(MI->getOperand(4).getReg());
Dan Gohman8e5f2c62008-07-07 23:14:23 +00002351 F->insert(It, copy0MBB);
2352 F->insert(It, sinkMBB);
Evan Chenga8e29892007-01-19 07:51:42 +00002353 // Update machine-CFG edges by first adding all successors of the current
2354 // block to the new block which will contain the Phi node for the select.
2355 for(MachineBasicBlock::succ_iterator i = BB->succ_begin(),
2356 e = BB->succ_end(); i != e; ++i)
2357 sinkMBB->addSuccessor(*i);
2358 // Next, remove all successors of the current block, and add the true
2359 // and fallthrough blocks as its successors.
2360 while(!BB->succ_empty())
2361 BB->removeSuccessor(BB->succ_begin());
2362 BB->addSuccessor(copy0MBB);
2363 BB->addSuccessor(sinkMBB);
2364
2365 // copy0MBB:
2366 // %FalseValue = ...
2367 // # fallthrough to sinkMBB
2368 BB = copy0MBB;
2369
2370 // Update machine-CFG edges
2371 BB->addSuccessor(sinkMBB);
2372
2373 // sinkMBB:
2374 // %Result = phi [ %FalseValue, copy0MBB ], [ %TrueValue, thisMBB ]
2375 // ...
2376 BB = sinkMBB;
Dale Johannesenb6728402009-02-13 02:25:56 +00002377 BuildMI(BB, dl, TII->get(ARM::PHI), MI->getOperand(0).getReg())
Evan Chenga8e29892007-01-19 07:51:42 +00002378 .addReg(MI->getOperand(1).getReg()).addMBB(copy0MBB)
2379 .addReg(MI->getOperand(2).getReg()).addMBB(thisMBB);
2380
Dan Gohman8e5f2c62008-07-07 23:14:23 +00002381 F->DeleteMachineInstr(MI); // The pseudo instruction is gone now.
Evan Chenga8e29892007-01-19 07:51:42 +00002382 return BB;
2383 }
2384 }
2385}
2386
2387//===----------------------------------------------------------------------===//
2388// ARM Optimization Hooks
2389//===----------------------------------------------------------------------===//
2390
Chris Lattnerd1980a52009-03-12 06:52:53 +00002391static
2392SDValue combineSelectAndUse(SDNode *N, SDValue Slct, SDValue OtherOp,
2393 TargetLowering::DAGCombinerInfo &DCI) {
Chris Lattnerd1980a52009-03-12 06:52:53 +00002394 SelectionDAG &DAG = DCI.DAG;
2395 const TargetLowering &TLI = DAG.getTargetLoweringInfo();
2396 MVT VT = N->getValueType(0);
2397 unsigned Opc = N->getOpcode();
2398 bool isSlctCC = Slct.getOpcode() == ISD::SELECT_CC;
2399 SDValue LHS = isSlctCC ? Slct.getOperand(2) : Slct.getOperand(1);
2400 SDValue RHS = isSlctCC ? Slct.getOperand(3) : Slct.getOperand(2);
2401 ISD::CondCode CC = ISD::SETCC_INVALID;
2402
2403 if (isSlctCC) {
2404 CC = cast<CondCodeSDNode>(Slct.getOperand(4))->get();
2405 } else {
2406 SDValue CCOp = Slct.getOperand(0);
2407 if (CCOp.getOpcode() == ISD::SETCC)
2408 CC = cast<CondCodeSDNode>(CCOp.getOperand(2))->get();
2409 }
2410
2411 bool DoXform = false;
2412 bool InvCC = false;
2413 assert ((Opc == ISD::ADD || (Opc == ISD::SUB && Slct == N->getOperand(1))) &&
2414 "Bad input!");
2415
2416 if (LHS.getOpcode() == ISD::Constant &&
2417 cast<ConstantSDNode>(LHS)->isNullValue()) {
2418 DoXform = true;
2419 } else if (CC != ISD::SETCC_INVALID &&
2420 RHS.getOpcode() == ISD::Constant &&
2421 cast<ConstantSDNode>(RHS)->isNullValue()) {
2422 std::swap(LHS, RHS);
2423 SDValue Op0 = Slct.getOperand(0);
2424 MVT OpVT = isSlctCC ? Op0.getValueType() :
2425 Op0.getOperand(0).getValueType();
2426 bool isInt = OpVT.isInteger();
2427 CC = ISD::getSetCCInverse(CC, isInt);
2428
2429 if (!TLI.isCondCodeLegal(CC, OpVT))
2430 return SDValue(); // Inverse operator isn't legal.
2431
2432 DoXform = true;
2433 InvCC = true;
2434 }
2435
2436 if (DoXform) {
2437 SDValue Result = DAG.getNode(Opc, RHS.getDebugLoc(), VT, OtherOp, RHS);
2438 if (isSlctCC)
2439 return DAG.getSelectCC(N->getDebugLoc(), OtherOp, Result,
2440 Slct.getOperand(0), Slct.getOperand(1), CC);
2441 SDValue CCOp = Slct.getOperand(0);
2442 if (InvCC)
2443 CCOp = DAG.getSetCC(Slct.getDebugLoc(), CCOp.getValueType(),
2444 CCOp.getOperand(0), CCOp.getOperand(1), CC);
2445 return DAG.getNode(ISD::SELECT, N->getDebugLoc(), VT,
2446 CCOp, OtherOp, Result);
2447 }
2448 return SDValue();
2449}
2450
2451/// PerformADDCombine - Target-specific dag combine xforms for ISD::ADD.
2452static SDValue PerformADDCombine(SDNode *N,
2453 TargetLowering::DAGCombinerInfo &DCI) {
2454 // added by evan in r37685 with no testcase.
2455 SDValue N0 = N->getOperand(0), N1 = N->getOperand(1);
Bob Wilson2dc4f542009-03-20 22:42:55 +00002456
Chris Lattnerd1980a52009-03-12 06:52:53 +00002457 // fold (add (select cc, 0, c), x) -> (select cc, x, (add, x, c))
2458 if (N0.getOpcode() == ISD::SELECT && N0.getNode()->hasOneUse()) {
2459 SDValue Result = combineSelectAndUse(N, N0, N1, DCI);
2460 if (Result.getNode()) return Result;
2461 }
2462 if (N1.getOpcode() == ISD::SELECT && N1.getNode()->hasOneUse()) {
2463 SDValue Result = combineSelectAndUse(N, N1, N0, DCI);
2464 if (Result.getNode()) return Result;
2465 }
Bob Wilson2dc4f542009-03-20 22:42:55 +00002466
Chris Lattnerd1980a52009-03-12 06:52:53 +00002467 return SDValue();
2468}
2469
2470/// PerformSUBCombine - Target-specific dag combine xforms for ISD::SUB.
2471static SDValue PerformSUBCombine(SDNode *N,
2472 TargetLowering::DAGCombinerInfo &DCI) {
2473 // added by evan in r37685 with no testcase.
2474 SDValue N0 = N->getOperand(0), N1 = N->getOperand(1);
Bob Wilson2dc4f542009-03-20 22:42:55 +00002475
Chris Lattnerd1980a52009-03-12 06:52:53 +00002476 // fold (sub x, (select cc, 0, c)) -> (select cc, x, (sub, x, c))
2477 if (N1.getOpcode() == ISD::SELECT && N1.getNode()->hasOneUse()) {
2478 SDValue Result = combineSelectAndUse(N, N1, N0, DCI);
2479 if (Result.getNode()) return Result;
2480 }
Bob Wilson2dc4f542009-03-20 22:42:55 +00002481
Chris Lattnerd1980a52009-03-12 06:52:53 +00002482 return SDValue();
2483}
2484
2485
Chris Lattnerf1b1c5e2007-11-27 22:36:16 +00002486/// PerformFMRRDCombine - Target-specific dag combine xforms for ARMISD::FMRRD.
Bob Wilson2dc4f542009-03-20 22:42:55 +00002487static SDValue PerformFMRRDCombine(SDNode *N,
2488 TargetLowering::DAGCombinerInfo &DCI) {
Chris Lattnerf1b1c5e2007-11-27 22:36:16 +00002489 // fmrrd(fmdrr x, y) -> x,y
Dan Gohman475871a2008-07-27 21:46:04 +00002490 SDValue InDouble = N->getOperand(0);
Chris Lattnerf1b1c5e2007-11-27 22:36:16 +00002491 if (InDouble.getOpcode() == ARMISD::FMDRR)
2492 return DCI.CombineTo(N, InDouble.getOperand(0), InDouble.getOperand(1));
Dan Gohman475871a2008-07-27 21:46:04 +00002493 return SDValue();
Chris Lattnerf1b1c5e2007-11-27 22:36:16 +00002494}
2495
Bob Wilson5bafff32009-06-22 23:27:02 +00002496/// getVShiftImm - Check if this is a valid build_vector for the immediate
2497/// operand of a vector shift operation, where all the elements of the
2498/// build_vector must have the same constant integer value.
2499static bool getVShiftImm(SDValue Op, unsigned ElementBits, int64_t &Cnt) {
2500 // Ignore bit_converts.
2501 while (Op.getOpcode() == ISD::BIT_CONVERT)
2502 Op = Op.getOperand(0);
2503 BuildVectorSDNode *BVN = dyn_cast<BuildVectorSDNode>(Op.getNode());
2504 APInt SplatBits, SplatUndef;
2505 unsigned SplatBitSize;
2506 bool HasAnyUndefs;
2507 if (! BVN || ! BVN->isConstantSplat(SplatBits, SplatUndef, SplatBitSize,
2508 HasAnyUndefs, ElementBits) ||
2509 SplatBitSize > ElementBits)
2510 return false;
2511 Cnt = SplatBits.getSExtValue();
2512 return true;
2513}
2514
2515/// isVShiftLImm - Check if this is a valid build_vector for the immediate
2516/// operand of a vector shift left operation. That value must be in the range:
2517/// 0 <= Value < ElementBits for a left shift; or
2518/// 0 <= Value <= ElementBits for a long left shift.
2519static bool isVShiftLImm(SDValue Op, MVT VT, bool isLong, int64_t &Cnt) {
2520 assert(VT.isVector() && "vector shift count is not a vector type");
2521 unsigned ElementBits = VT.getVectorElementType().getSizeInBits();
2522 if (! getVShiftImm(Op, ElementBits, Cnt))
2523 return false;
2524 return (Cnt >= 0 && (isLong ? Cnt-1 : Cnt) < ElementBits);
2525}
2526
2527/// isVShiftRImm - Check if this is a valid build_vector for the immediate
2528/// operand of a vector shift right operation. For a shift opcode, the value
2529/// is positive, but for an intrinsic the value count must be negative. The
2530/// absolute value must be in the range:
2531/// 1 <= |Value| <= ElementBits for a right shift; or
2532/// 1 <= |Value| <= ElementBits/2 for a narrow right shift.
2533static bool isVShiftRImm(SDValue Op, MVT VT, bool isNarrow, bool isIntrinsic,
2534 int64_t &Cnt) {
2535 assert(VT.isVector() && "vector shift count is not a vector type");
2536 unsigned ElementBits = VT.getVectorElementType().getSizeInBits();
2537 if (! getVShiftImm(Op, ElementBits, Cnt))
2538 return false;
2539 if (isIntrinsic)
2540 Cnt = -Cnt;
2541 return (Cnt >= 1 && Cnt <= (isNarrow ? ElementBits/2 : ElementBits));
2542}
2543
2544/// PerformIntrinsicCombine - ARM-specific DAG combining for intrinsics.
2545static SDValue PerformIntrinsicCombine(SDNode *N, SelectionDAG &DAG) {
2546 unsigned IntNo = cast<ConstantSDNode>(N->getOperand(0))->getZExtValue();
2547 switch (IntNo) {
2548 default:
2549 // Don't do anything for most intrinsics.
2550 break;
2551
2552 // Vector shifts: check for immediate versions and lower them.
2553 // Note: This is done during DAG combining instead of DAG legalizing because
2554 // the build_vectors for 64-bit vector element shift counts are generally
2555 // not legal, and it is hard to see their values after they get legalized to
2556 // loads from a constant pool.
2557 case Intrinsic::arm_neon_vshifts:
2558 case Intrinsic::arm_neon_vshiftu:
2559 case Intrinsic::arm_neon_vshiftls:
2560 case Intrinsic::arm_neon_vshiftlu:
2561 case Intrinsic::arm_neon_vshiftn:
2562 case Intrinsic::arm_neon_vrshifts:
2563 case Intrinsic::arm_neon_vrshiftu:
2564 case Intrinsic::arm_neon_vrshiftn:
2565 case Intrinsic::arm_neon_vqshifts:
2566 case Intrinsic::arm_neon_vqshiftu:
2567 case Intrinsic::arm_neon_vqshiftsu:
2568 case Intrinsic::arm_neon_vqshiftns:
2569 case Intrinsic::arm_neon_vqshiftnu:
2570 case Intrinsic::arm_neon_vqshiftnsu:
2571 case Intrinsic::arm_neon_vqrshiftns:
2572 case Intrinsic::arm_neon_vqrshiftnu:
2573 case Intrinsic::arm_neon_vqrshiftnsu: {
2574 MVT VT = N->getOperand(1).getValueType();
2575 int64_t Cnt;
2576 unsigned VShiftOpc = 0;
2577
2578 switch (IntNo) {
2579 case Intrinsic::arm_neon_vshifts:
2580 case Intrinsic::arm_neon_vshiftu:
2581 if (isVShiftLImm(N->getOperand(2), VT, false, Cnt)) {
2582 VShiftOpc = ARMISD::VSHL;
2583 break;
2584 }
2585 if (isVShiftRImm(N->getOperand(2), VT, false, true, Cnt)) {
2586 VShiftOpc = (IntNo == Intrinsic::arm_neon_vshifts ?
2587 ARMISD::VSHRs : ARMISD::VSHRu);
2588 break;
2589 }
2590 return SDValue();
2591
2592 case Intrinsic::arm_neon_vshiftls:
2593 case Intrinsic::arm_neon_vshiftlu:
2594 if (isVShiftLImm(N->getOperand(2), VT, true, Cnt))
2595 break;
2596 assert(0 && "invalid shift count for vshll intrinsic");
2597 abort();
2598
2599 case Intrinsic::arm_neon_vrshifts:
2600 case Intrinsic::arm_neon_vrshiftu:
2601 if (isVShiftRImm(N->getOperand(2), VT, false, true, Cnt))
2602 break;
2603 return SDValue();
2604
2605 case Intrinsic::arm_neon_vqshifts:
2606 case Intrinsic::arm_neon_vqshiftu:
2607 if (isVShiftLImm(N->getOperand(2), VT, false, Cnt))
2608 break;
2609 return SDValue();
2610
2611 case Intrinsic::arm_neon_vqshiftsu:
2612 if (isVShiftLImm(N->getOperand(2), VT, false, Cnt))
2613 break;
2614 assert(0 && "invalid shift count for vqshlu intrinsic");
2615 abort();
2616
2617 case Intrinsic::arm_neon_vshiftn:
2618 case Intrinsic::arm_neon_vrshiftn:
2619 case Intrinsic::arm_neon_vqshiftns:
2620 case Intrinsic::arm_neon_vqshiftnu:
2621 case Intrinsic::arm_neon_vqshiftnsu:
2622 case Intrinsic::arm_neon_vqrshiftns:
2623 case Intrinsic::arm_neon_vqrshiftnu:
2624 case Intrinsic::arm_neon_vqrshiftnsu:
2625 // Narrowing shifts require an immediate right shift.
2626 if (isVShiftRImm(N->getOperand(2), VT, true, true, Cnt))
2627 break;
2628 assert(0 && "invalid shift count for narrowing vector shift intrinsic");
2629 abort();
2630
2631 default:
2632 assert(0 && "unhandled vector shift");
2633 }
2634
2635 switch (IntNo) {
2636 case Intrinsic::arm_neon_vshifts:
2637 case Intrinsic::arm_neon_vshiftu:
2638 // Opcode already set above.
2639 break;
2640 case Intrinsic::arm_neon_vshiftls:
2641 case Intrinsic::arm_neon_vshiftlu:
2642 if (Cnt == VT.getVectorElementType().getSizeInBits())
2643 VShiftOpc = ARMISD::VSHLLi;
2644 else
2645 VShiftOpc = (IntNo == Intrinsic::arm_neon_vshiftls ?
2646 ARMISD::VSHLLs : ARMISD::VSHLLu);
2647 break;
2648 case Intrinsic::arm_neon_vshiftn:
2649 VShiftOpc = ARMISD::VSHRN; break;
2650 case Intrinsic::arm_neon_vrshifts:
2651 VShiftOpc = ARMISD::VRSHRs; break;
2652 case Intrinsic::arm_neon_vrshiftu:
2653 VShiftOpc = ARMISD::VRSHRu; break;
2654 case Intrinsic::arm_neon_vrshiftn:
2655 VShiftOpc = ARMISD::VRSHRN; break;
2656 case Intrinsic::arm_neon_vqshifts:
2657 VShiftOpc = ARMISD::VQSHLs; break;
2658 case Intrinsic::arm_neon_vqshiftu:
2659 VShiftOpc = ARMISD::VQSHLu; break;
2660 case Intrinsic::arm_neon_vqshiftsu:
2661 VShiftOpc = ARMISD::VQSHLsu; break;
2662 case Intrinsic::arm_neon_vqshiftns:
2663 VShiftOpc = ARMISD::VQSHRNs; break;
2664 case Intrinsic::arm_neon_vqshiftnu:
2665 VShiftOpc = ARMISD::VQSHRNu; break;
2666 case Intrinsic::arm_neon_vqshiftnsu:
2667 VShiftOpc = ARMISD::VQSHRNsu; break;
2668 case Intrinsic::arm_neon_vqrshiftns:
2669 VShiftOpc = ARMISD::VQRSHRNs; break;
2670 case Intrinsic::arm_neon_vqrshiftnu:
2671 VShiftOpc = ARMISD::VQRSHRNu; break;
2672 case Intrinsic::arm_neon_vqrshiftnsu:
2673 VShiftOpc = ARMISD::VQRSHRNsu; break;
2674 }
2675
2676 return DAG.getNode(VShiftOpc, N->getDebugLoc(), N->getValueType(0),
2677 N->getOperand(1), DAG.getConstant(Cnt, MVT::i32));
2678 }
2679
2680 case Intrinsic::arm_neon_vshiftins: {
2681 MVT VT = N->getOperand(1).getValueType();
2682 int64_t Cnt;
2683 unsigned VShiftOpc = 0;
2684
2685 if (isVShiftLImm(N->getOperand(3), VT, false, Cnt))
2686 VShiftOpc = ARMISD::VSLI;
2687 else if (isVShiftRImm(N->getOperand(3), VT, false, true, Cnt))
2688 VShiftOpc = ARMISD::VSRI;
2689 else {
2690 assert(0 && "invalid shift count for vsli/vsri intrinsic");
2691 abort();
2692 }
2693
2694 return DAG.getNode(VShiftOpc, N->getDebugLoc(), N->getValueType(0),
2695 N->getOperand(1), N->getOperand(2),
2696 DAG.getConstant(Cnt, MVT::i32));
2697 }
2698
2699 case Intrinsic::arm_neon_vqrshifts:
2700 case Intrinsic::arm_neon_vqrshiftu:
2701 // No immediate versions of these to check for.
2702 break;
2703 }
2704
2705 return SDValue();
2706}
2707
2708/// PerformShiftCombine - Checks for immediate versions of vector shifts and
2709/// lowers them. As with the vector shift intrinsics, this is done during DAG
2710/// combining instead of DAG legalizing because the build_vectors for 64-bit
2711/// vector element shift counts are generally not legal, and it is hard to see
2712/// their values after they get legalized to loads from a constant pool.
2713static SDValue PerformShiftCombine(SDNode *N, SelectionDAG &DAG,
2714 const ARMSubtarget *ST) {
2715 MVT VT = N->getValueType(0);
2716
2717 // Nothing to be done for scalar shifts.
2718 if (! VT.isVector())
2719 return SDValue();
2720
2721 assert(ST->hasNEON() && "unexpected vector shift");
2722 int64_t Cnt;
2723
2724 switch (N->getOpcode()) {
2725 default: assert(0 && "unexpected shift opcode");
2726
2727 case ISD::SHL:
2728 if (isVShiftLImm(N->getOperand(1), VT, false, Cnt))
2729 return DAG.getNode(ARMISD::VSHL, N->getDebugLoc(), VT, N->getOperand(0),
2730 DAG.getConstant(Cnt, MVT::i32));
2731 break;
2732
2733 case ISD::SRA:
2734 case ISD::SRL:
2735 if (isVShiftRImm(N->getOperand(1), VT, false, false, Cnt)) {
2736 unsigned VShiftOpc = (N->getOpcode() == ISD::SRA ?
2737 ARMISD::VSHRs : ARMISD::VSHRu);
2738 return DAG.getNode(VShiftOpc, N->getDebugLoc(), VT, N->getOperand(0),
2739 DAG.getConstant(Cnt, MVT::i32));
2740 }
2741 }
2742 return SDValue();
2743}
2744
2745/// PerformExtendCombine - Target-specific DAG combining for ISD::SIGN_EXTEND,
2746/// ISD::ZERO_EXTEND, and ISD::ANY_EXTEND.
2747static SDValue PerformExtendCombine(SDNode *N, SelectionDAG &DAG,
2748 const ARMSubtarget *ST) {
2749 SDValue N0 = N->getOperand(0);
2750
2751 // Check for sign- and zero-extensions of vector extract operations of 8-
2752 // and 16-bit vector elements. NEON supports these directly. They are
2753 // handled during DAG combining because type legalization will promote them
2754 // to 32-bit types and it is messy to recognize the operations after that.
2755 if (ST->hasNEON() && N0.getOpcode() == ISD::EXTRACT_VECTOR_ELT) {
2756 SDValue Vec = N0.getOperand(0);
2757 SDValue Lane = N0.getOperand(1);
2758 MVT VT = N->getValueType(0);
2759 MVT EltVT = N0.getValueType();
2760 const TargetLowering &TLI = DAG.getTargetLoweringInfo();
2761
2762 if (VT == MVT::i32 &&
2763 (EltVT == MVT::i8 || EltVT == MVT::i16) &&
2764 TLI.isTypeLegal(Vec.getValueType())) {
2765
2766 unsigned Opc = 0;
2767 switch (N->getOpcode()) {
2768 default: assert(0 && "unexpected opcode");
2769 case ISD::SIGN_EXTEND:
2770 Opc = ARMISD::VGETLANEs;
2771 break;
2772 case ISD::ZERO_EXTEND:
2773 case ISD::ANY_EXTEND:
2774 Opc = ARMISD::VGETLANEu;
2775 break;
2776 }
2777 return DAG.getNode(Opc, N->getDebugLoc(), VT, Vec, Lane);
2778 }
2779 }
2780
2781 return SDValue();
2782}
2783
Dan Gohman475871a2008-07-27 21:46:04 +00002784SDValue ARMTargetLowering::PerformDAGCombine(SDNode *N,
Bob Wilson2dc4f542009-03-20 22:42:55 +00002785 DAGCombinerInfo &DCI) const {
Chris Lattnerf1b1c5e2007-11-27 22:36:16 +00002786 switch (N->getOpcode()) {
2787 default: break;
Chris Lattnerd1980a52009-03-12 06:52:53 +00002788 case ISD::ADD: return PerformADDCombine(N, DCI);
2789 case ISD::SUB: return PerformSUBCombine(N, DCI);
Chris Lattnerf1b1c5e2007-11-27 22:36:16 +00002790 case ARMISD::FMRRD: return PerformFMRRDCombine(N, DCI);
Bob Wilson5bafff32009-06-22 23:27:02 +00002791 case ISD::INTRINSIC_WO_CHAIN:
2792 return PerformIntrinsicCombine(N, DCI.DAG);
2793 case ISD::SHL:
2794 case ISD::SRA:
2795 case ISD::SRL:
2796 return PerformShiftCombine(N, DCI.DAG, Subtarget);
2797 case ISD::SIGN_EXTEND:
2798 case ISD::ZERO_EXTEND:
2799 case ISD::ANY_EXTEND:
2800 return PerformExtendCombine(N, DCI.DAG, Subtarget);
Chris Lattnerf1b1c5e2007-11-27 22:36:16 +00002801 }
Dan Gohman475871a2008-07-27 21:46:04 +00002802 return SDValue();
Chris Lattnerf1b1c5e2007-11-27 22:36:16 +00002803}
2804
Evan Chengb01fad62007-03-12 23:30:29 +00002805/// isLegalAddressImmediate - Return true if the integer value can be used
2806/// as the offset of the target addressing mode for load / store of the
2807/// given type.
Duncan Sands83ec4b62008-06-06 12:08:01 +00002808static bool isLegalAddressImmediate(int64_t V, MVT VT,
Chris Lattner37caf8c2007-04-09 23:33:39 +00002809 const ARMSubtarget *Subtarget) {
Evan Cheng961f8792007-03-13 20:37:59 +00002810 if (V == 0)
2811 return true;
2812
Evan Cheng65011532009-03-09 19:15:00 +00002813 if (!VT.isSimple())
2814 return false;
2815
Evan Chengb01fad62007-03-12 23:30:29 +00002816 if (Subtarget->isThumb()) {
2817 if (V < 0)
2818 return false;
2819
2820 unsigned Scale = 1;
Duncan Sands83ec4b62008-06-06 12:08:01 +00002821 switch (VT.getSimpleVT()) {
Evan Chengb01fad62007-03-12 23:30:29 +00002822 default: return false;
2823 case MVT::i1:
2824 case MVT::i8:
2825 // Scale == 1;
2826 break;
2827 case MVT::i16:
2828 // Scale == 2;
2829 Scale = 2;
2830 break;
2831 case MVT::i32:
2832 // Scale == 4;
2833 Scale = 4;
2834 break;
2835 }
2836
2837 if ((V & (Scale - 1)) != 0)
2838 return false;
2839 V /= Scale;
Anton Korobeynikov7c1c2612008-02-20 11:22:39 +00002840 return V == (V & ((1LL << 5) - 1));
Evan Chengb01fad62007-03-12 23:30:29 +00002841 }
2842
2843 if (V < 0)
2844 V = - V;
Duncan Sands83ec4b62008-06-06 12:08:01 +00002845 switch (VT.getSimpleVT()) {
Evan Chengb01fad62007-03-12 23:30:29 +00002846 default: return false;
2847 case MVT::i1:
2848 case MVT::i8:
2849 case MVT::i32:
2850 // +- imm12
Anton Korobeynikov7c1c2612008-02-20 11:22:39 +00002851 return V == (V & ((1LL << 12) - 1));
Evan Chengb01fad62007-03-12 23:30:29 +00002852 case MVT::i16:
2853 // +- imm8
Anton Korobeynikov7c1c2612008-02-20 11:22:39 +00002854 return V == (V & ((1LL << 8) - 1));
Evan Chengb01fad62007-03-12 23:30:29 +00002855 case MVT::f32:
2856 case MVT::f64:
2857 if (!Subtarget->hasVFP2())
2858 return false;
Evan Cheng0b0a9a92007-05-03 02:00:18 +00002859 if ((V & 3) != 0)
Evan Chengb01fad62007-03-12 23:30:29 +00002860 return false;
2861 V >>= 2;
Anton Korobeynikov7c1c2612008-02-20 11:22:39 +00002862 return V == (V & ((1LL << 8) - 1));
Evan Chengb01fad62007-03-12 23:30:29 +00002863 }
Evan Chenga8e29892007-01-19 07:51:42 +00002864}
2865
Chris Lattner37caf8c2007-04-09 23:33:39 +00002866/// isLegalAddressingMode - Return true if the addressing mode represented
2867/// by AM is legal for this target, for a load/store of the specified type.
Bob Wilson2dc4f542009-03-20 22:42:55 +00002868bool ARMTargetLowering::isLegalAddressingMode(const AddrMode &AM,
Chris Lattner37caf8c2007-04-09 23:33:39 +00002869 const Type *Ty) const {
Bob Wilson2c7dab12009-04-08 17:55:28 +00002870 MVT VT = getValueType(Ty, true);
2871 if (!isLegalAddressImmediate(AM.BaseOffs, VT, Subtarget))
Evan Chengb01fad62007-03-12 23:30:29 +00002872 return false;
Bob Wilson2dc4f542009-03-20 22:42:55 +00002873
Chris Lattner37caf8c2007-04-09 23:33:39 +00002874 // Can never fold addr of global into load/store.
Bob Wilson2dc4f542009-03-20 22:42:55 +00002875 if (AM.BaseGV)
Chris Lattner37caf8c2007-04-09 23:33:39 +00002876 return false;
Bob Wilson2dc4f542009-03-20 22:42:55 +00002877
Chris Lattner37caf8c2007-04-09 23:33:39 +00002878 switch (AM.Scale) {
2879 case 0: // no scale reg, must be "r+i" or "r", or "i".
2880 break;
2881 case 1:
2882 if (Subtarget->isThumb())
2883 return false;
Chris Lattner5a3d40d2007-04-13 06:50:55 +00002884 // FALL THROUGH.
Chris Lattner37caf8c2007-04-09 23:33:39 +00002885 default:
Chris Lattner5a3d40d2007-04-13 06:50:55 +00002886 // ARM doesn't support any R+R*scale+imm addr modes.
2887 if (AM.BaseOffs)
2888 return false;
Bob Wilson2dc4f542009-03-20 22:42:55 +00002889
Bob Wilson2c7dab12009-04-08 17:55:28 +00002890 if (!VT.isSimple())
2891 return false;
2892
Chris Lattnereb13d1b2007-04-10 03:48:29 +00002893 int Scale = AM.Scale;
Bob Wilson2c7dab12009-04-08 17:55:28 +00002894 switch (VT.getSimpleVT()) {
Chris Lattner37caf8c2007-04-09 23:33:39 +00002895 default: return false;
2896 case MVT::i1:
2897 case MVT::i8:
2898 case MVT::i32:
2899 case MVT::i64:
2900 // This assumes i64 is legalized to a pair of i32. If not (i.e.
2901 // ldrd / strd are used, then its address mode is same as i16.
2902 // r + r
Chris Lattnereb13d1b2007-04-10 03:48:29 +00002903 if (Scale < 0) Scale = -Scale;
2904 if (Scale == 1)
Chris Lattner37caf8c2007-04-09 23:33:39 +00002905 return true;
2906 // r + r << imm
Chris Lattnere1152942007-04-11 16:17:12 +00002907 return isPowerOf2_32(Scale & ~1);
Chris Lattner37caf8c2007-04-09 23:33:39 +00002908 case MVT::i16:
2909 // r + r
Chris Lattnereb13d1b2007-04-10 03:48:29 +00002910 if (((unsigned)AM.HasBaseReg + Scale) <= 2)
Chris Lattner37caf8c2007-04-09 23:33:39 +00002911 return true;
Chris Lattnere1152942007-04-11 16:17:12 +00002912 return false;
Bob Wilson2dc4f542009-03-20 22:42:55 +00002913
Chris Lattner37caf8c2007-04-09 23:33:39 +00002914 case MVT::isVoid:
2915 // Note, we allow "void" uses (basically, uses that aren't loads or
2916 // stores), because arm allows folding a scale into many arithmetic
2917 // operations. This should be made more precise and revisited later.
Bob Wilson2dc4f542009-03-20 22:42:55 +00002918
Chris Lattner37caf8c2007-04-09 23:33:39 +00002919 // Allow r << imm, but the imm has to be a multiple of two.
2920 if (AM.Scale & 1) return false;
2921 return isPowerOf2_32(AM.Scale);
2922 }
2923 break;
Evan Chengb01fad62007-03-12 23:30:29 +00002924 }
Chris Lattner37caf8c2007-04-09 23:33:39 +00002925 return true;
Evan Chengb01fad62007-03-12 23:30:29 +00002926}
2927
Evan Chenge88d5ce2009-07-02 07:28:31 +00002928static bool getARMIndexedAddressParts(SDNode *Ptr, MVT VT,
2929 bool isSEXTLoad, SDValue &Base,
2930 SDValue &Offset, bool &isInc,
2931 SelectionDAG &DAG) {
Evan Chenga8e29892007-01-19 07:51:42 +00002932 if (Ptr->getOpcode() != ISD::ADD && Ptr->getOpcode() != ISD::SUB)
2933 return false;
2934
2935 if (VT == MVT::i16 || ((VT == MVT::i8 || VT == MVT::i1) && isSEXTLoad)) {
2936 // AddressingMode 3
2937 Base = Ptr->getOperand(0);
2938 if (ConstantSDNode *RHS = dyn_cast<ConstantSDNode>(Ptr->getOperand(1))) {
Dan Gohmanf5aeb1a2008-09-12 16:56:44 +00002939 int RHSC = (int)RHS->getZExtValue();
Evan Chenga8e29892007-01-19 07:51:42 +00002940 if (RHSC < 0 && RHSC > -256) {
Evan Chenge88d5ce2009-07-02 07:28:31 +00002941 assert(Ptr->getOpcode() == ISD::ADD);
Evan Chenga8e29892007-01-19 07:51:42 +00002942 isInc = false;
2943 Offset = DAG.getConstant(-RHSC, RHS->getValueType(0));
2944 return true;
2945 }
2946 }
2947 isInc = (Ptr->getOpcode() == ISD::ADD);
2948 Offset = Ptr->getOperand(1);
2949 return true;
2950 } else if (VT == MVT::i32 || VT == MVT::i8 || VT == MVT::i1) {
2951 // AddressingMode 2
2952 if (ConstantSDNode *RHS = dyn_cast<ConstantSDNode>(Ptr->getOperand(1))) {
Dan Gohmanf5aeb1a2008-09-12 16:56:44 +00002953 int RHSC = (int)RHS->getZExtValue();
Evan Chenga8e29892007-01-19 07:51:42 +00002954 if (RHSC < 0 && RHSC > -0x1000) {
Evan Chenge88d5ce2009-07-02 07:28:31 +00002955 assert(Ptr->getOpcode() == ISD::ADD);
Evan Chenga8e29892007-01-19 07:51:42 +00002956 isInc = false;
2957 Offset = DAG.getConstant(-RHSC, RHS->getValueType(0));
2958 Base = Ptr->getOperand(0);
2959 return true;
2960 }
2961 }
2962
2963 if (Ptr->getOpcode() == ISD::ADD) {
2964 isInc = true;
2965 ARM_AM::ShiftOpc ShOpcVal= ARM_AM::getShiftOpcForNode(Ptr->getOperand(0));
2966 if (ShOpcVal != ARM_AM::no_shift) {
2967 Base = Ptr->getOperand(1);
2968 Offset = Ptr->getOperand(0);
2969 } else {
2970 Base = Ptr->getOperand(0);
2971 Offset = Ptr->getOperand(1);
2972 }
2973 return true;
2974 }
2975
2976 isInc = (Ptr->getOpcode() == ISD::ADD);
2977 Base = Ptr->getOperand(0);
2978 Offset = Ptr->getOperand(1);
2979 return true;
2980 }
2981
2982 // FIXME: Use FLDM / FSTM to emulate indexed FP load / store.
2983 return false;
2984}
2985
Evan Chenge88d5ce2009-07-02 07:28:31 +00002986static bool getT2IndexedAddressParts(SDNode *Ptr, MVT VT,
2987 bool isSEXTLoad, SDValue &Base,
2988 SDValue &Offset, bool &isInc,
2989 SelectionDAG &DAG) {
2990 if (Ptr->getOpcode() != ISD::ADD && Ptr->getOpcode() != ISD::SUB)
2991 return false;
2992
2993 Base = Ptr->getOperand(0);
2994 if (ConstantSDNode *RHS = dyn_cast<ConstantSDNode>(Ptr->getOperand(1))) {
2995 int RHSC = (int)RHS->getZExtValue();
2996 if (RHSC < 0 && RHSC > -0x100) { // 8 bits.
2997 assert(Ptr->getOpcode() == ISD::ADD);
2998 isInc = false;
2999 Offset = DAG.getConstant(-RHSC, RHS->getValueType(0));
3000 return true;
3001 } else if (RHSC > 0 && RHSC < 0x100) { // 8 bit, no zero.
3002 isInc = Ptr->getOpcode() == ISD::ADD;
3003 Offset = DAG.getConstant(RHSC, RHS->getValueType(0));
3004 return true;
3005 }
3006 }
3007
3008 return false;
3009}
3010
Evan Chenga8e29892007-01-19 07:51:42 +00003011/// getPreIndexedAddressParts - returns true by value, base pointer and
3012/// offset pointer and addressing mode by reference if the node's address
3013/// can be legally represented as pre-indexed load / store address.
3014bool
Dan Gohman475871a2008-07-27 21:46:04 +00003015ARMTargetLowering::getPreIndexedAddressParts(SDNode *N, SDValue &Base,
3016 SDValue &Offset,
Evan Chenga8e29892007-01-19 07:51:42 +00003017 ISD::MemIndexedMode &AM,
Dan Gohman73e09142009-01-15 16:29:45 +00003018 SelectionDAG &DAG) const {
Evan Chenge88d5ce2009-07-02 07:28:31 +00003019 if (Subtarget->isThumb1Only())
Evan Chenga8e29892007-01-19 07:51:42 +00003020 return false;
3021
Duncan Sands83ec4b62008-06-06 12:08:01 +00003022 MVT VT;
Dan Gohman475871a2008-07-27 21:46:04 +00003023 SDValue Ptr;
Evan Chenga8e29892007-01-19 07:51:42 +00003024 bool isSEXTLoad = false;
3025 if (LoadSDNode *LD = dyn_cast<LoadSDNode>(N)) {
3026 Ptr = LD->getBasePtr();
Dan Gohmanb625f2f2008-01-30 00:15:11 +00003027 VT = LD->getMemoryVT();
Evan Chenga8e29892007-01-19 07:51:42 +00003028 isSEXTLoad = LD->getExtensionType() == ISD::SEXTLOAD;
3029 } else if (StoreSDNode *ST = dyn_cast<StoreSDNode>(N)) {
3030 Ptr = ST->getBasePtr();
Dan Gohmanb625f2f2008-01-30 00:15:11 +00003031 VT = ST->getMemoryVT();
Evan Chenga8e29892007-01-19 07:51:42 +00003032 } else
3033 return false;
3034
3035 bool isInc;
Evan Chenge88d5ce2009-07-02 07:28:31 +00003036 bool isLegal = false;
3037 if (Subtarget->isThumb2())
3038 isLegal = getT2IndexedAddressParts(Ptr.getNode(), VT, isSEXTLoad, Base,
3039 Offset, isInc, DAG);
3040 else
3041 isLegal = getARMIndexedAddressParts(Ptr.getNode(), VT, isSEXTLoad, Base,
Evan Cheng04129572009-07-02 06:44:30 +00003042 Offset, isInc, DAG);
Evan Chenge88d5ce2009-07-02 07:28:31 +00003043 if (!isLegal)
3044 return false;
3045
3046 AM = isInc ? ISD::PRE_INC : ISD::PRE_DEC;
3047 return true;
Evan Chenga8e29892007-01-19 07:51:42 +00003048}
3049
3050/// getPostIndexedAddressParts - returns true by value, base pointer and
3051/// offset pointer and addressing mode by reference if this node can be
3052/// combined with a load / store to form a post-indexed load / store.
3053bool ARMTargetLowering::getPostIndexedAddressParts(SDNode *N, SDNode *Op,
Dan Gohman475871a2008-07-27 21:46:04 +00003054 SDValue &Base,
3055 SDValue &Offset,
Evan Chenga8e29892007-01-19 07:51:42 +00003056 ISD::MemIndexedMode &AM,
Dan Gohman73e09142009-01-15 16:29:45 +00003057 SelectionDAG &DAG) const {
Evan Chenge88d5ce2009-07-02 07:28:31 +00003058 if (Subtarget->isThumb1Only())
Evan Chenga8e29892007-01-19 07:51:42 +00003059 return false;
3060
Duncan Sands83ec4b62008-06-06 12:08:01 +00003061 MVT VT;
Dan Gohman475871a2008-07-27 21:46:04 +00003062 SDValue Ptr;
Evan Chenga8e29892007-01-19 07:51:42 +00003063 bool isSEXTLoad = false;
3064 if (LoadSDNode *LD = dyn_cast<LoadSDNode>(N)) {
Dan Gohmanb625f2f2008-01-30 00:15:11 +00003065 VT = LD->getMemoryVT();
Evan Chenga8e29892007-01-19 07:51:42 +00003066 isSEXTLoad = LD->getExtensionType() == ISD::SEXTLOAD;
3067 } else if (StoreSDNode *ST = dyn_cast<StoreSDNode>(N)) {
Dan Gohmanb625f2f2008-01-30 00:15:11 +00003068 VT = ST->getMemoryVT();
Evan Chenga8e29892007-01-19 07:51:42 +00003069 } else
3070 return false;
3071
3072 bool isInc;
Evan Chenge88d5ce2009-07-02 07:28:31 +00003073 bool isLegal = false;
3074 if (Subtarget->isThumb2())
3075 isLegal = getT2IndexedAddressParts(Op, VT, isSEXTLoad, Base, Offset,
Evan Chenga8e29892007-01-19 07:51:42 +00003076 isInc, DAG);
Evan Chenge88d5ce2009-07-02 07:28:31 +00003077 else
3078 isLegal = getARMIndexedAddressParts(Op, VT, isSEXTLoad, Base, Offset,
3079 isInc, DAG);
3080 if (!isLegal)
3081 return false;
3082
3083 AM = isInc ? ISD::POST_INC : ISD::POST_DEC;
3084 return true;
Evan Chenga8e29892007-01-19 07:51:42 +00003085}
3086
Dan Gohman475871a2008-07-27 21:46:04 +00003087void ARMTargetLowering::computeMaskedBitsForTargetNode(const SDValue Op,
Dan Gohman977a76f2008-02-13 22:28:48 +00003088 const APInt &Mask,
Bob Wilson2dc4f542009-03-20 22:42:55 +00003089 APInt &KnownZero,
Dan Gohmanfd29e0e2008-02-13 00:35:47 +00003090 APInt &KnownOne,
Dan Gohmanea859be2007-06-22 14:59:07 +00003091 const SelectionDAG &DAG,
Evan Chenga8e29892007-01-19 07:51:42 +00003092 unsigned Depth) const {
Dan Gohmanfd29e0e2008-02-13 00:35:47 +00003093 KnownZero = KnownOne = APInt(Mask.getBitWidth(), 0);
Evan Chenga8e29892007-01-19 07:51:42 +00003094 switch (Op.getOpcode()) {
3095 default: break;
3096 case ARMISD::CMOV: {
3097 // Bits are known zero/one if known on the LHS and RHS.
Dan Gohmanea859be2007-06-22 14:59:07 +00003098 DAG.ComputeMaskedBits(Op.getOperand(0), Mask, KnownZero, KnownOne, Depth+1);
Evan Chenga8e29892007-01-19 07:51:42 +00003099 if (KnownZero == 0 && KnownOne == 0) return;
3100
Dan Gohmanfd29e0e2008-02-13 00:35:47 +00003101 APInt KnownZeroRHS, KnownOneRHS;
Dan Gohmanea859be2007-06-22 14:59:07 +00003102 DAG.ComputeMaskedBits(Op.getOperand(1), Mask,
3103 KnownZeroRHS, KnownOneRHS, Depth+1);
Evan Chenga8e29892007-01-19 07:51:42 +00003104 KnownZero &= KnownZeroRHS;
3105 KnownOne &= KnownOneRHS;
3106 return;
3107 }
3108 }
3109}
3110
3111//===----------------------------------------------------------------------===//
3112// ARM Inline Assembly Support
3113//===----------------------------------------------------------------------===//
3114
3115/// getConstraintType - Given a constraint letter, return the type of
3116/// constraint it is for this target.
3117ARMTargetLowering::ConstraintType
Chris Lattner4234f572007-03-25 02:14:49 +00003118ARMTargetLowering::getConstraintType(const std::string &Constraint) const {
3119 if (Constraint.size() == 1) {
3120 switch (Constraint[0]) {
3121 default: break;
3122 case 'l': return C_RegisterClass;
Chris Lattnerc4e3f8e2007-04-02 17:24:08 +00003123 case 'w': return C_RegisterClass;
Chris Lattner4234f572007-03-25 02:14:49 +00003124 }
Evan Chenga8e29892007-01-19 07:51:42 +00003125 }
Chris Lattner4234f572007-03-25 02:14:49 +00003126 return TargetLowering::getConstraintType(Constraint);
Evan Chenga8e29892007-01-19 07:51:42 +00003127}
3128
Bob Wilson2dc4f542009-03-20 22:42:55 +00003129std::pair<unsigned, const TargetRegisterClass*>
Evan Chenga8e29892007-01-19 07:51:42 +00003130ARMTargetLowering::getRegForInlineAsmConstraint(const std::string &Constraint,
Duncan Sands83ec4b62008-06-06 12:08:01 +00003131 MVT VT) const {
Evan Chenga8e29892007-01-19 07:51:42 +00003132 if (Constraint.size() == 1) {
3133 // GCC RS6000 Constraint Letters
3134 switch (Constraint[0]) {
Chris Lattnerc4e3f8e2007-04-02 17:24:08 +00003135 case 'l':
Jim Grosbach30eae3c2009-04-07 20:34:09 +00003136 if (Subtarget->isThumb())
3137 return std::make_pair(0U, ARM::tGPRRegisterClass);
3138 else
3139 return std::make_pair(0U, ARM::GPRRegisterClass);
Chris Lattnerc4e3f8e2007-04-02 17:24:08 +00003140 case 'r':
3141 return std::make_pair(0U, ARM::GPRRegisterClass);
3142 case 'w':
3143 if (VT == MVT::f32)
3144 return std::make_pair(0U, ARM::SPRRegisterClass);
Evan Cheng0a7baa22007-04-04 00:06:07 +00003145 if (VT == MVT::f64)
Chris Lattnerc4e3f8e2007-04-02 17:24:08 +00003146 return std::make_pair(0U, ARM::DPRRegisterClass);
3147 break;
Evan Chenga8e29892007-01-19 07:51:42 +00003148 }
3149 }
3150 return TargetLowering::getRegForInlineAsmConstraint(Constraint, VT);
3151}
3152
3153std::vector<unsigned> ARMTargetLowering::
3154getRegClassForInlineAsmConstraint(const std::string &Constraint,
Duncan Sands83ec4b62008-06-06 12:08:01 +00003155 MVT VT) const {
Evan Chenga8e29892007-01-19 07:51:42 +00003156 if (Constraint.size() != 1)
3157 return std::vector<unsigned>();
3158
3159 switch (Constraint[0]) { // GCC ARM Constraint Letters
3160 default: break;
3161 case 'l':
Jim Grosbach30eae3c2009-04-07 20:34:09 +00003162 return make_vector<unsigned>(ARM::R0, ARM::R1, ARM::R2, ARM::R3,
3163 ARM::R4, ARM::R5, ARM::R6, ARM::R7,
3164 0);
Evan Chenga8e29892007-01-19 07:51:42 +00003165 case 'r':
3166 return make_vector<unsigned>(ARM::R0, ARM::R1, ARM::R2, ARM::R3,
3167 ARM::R4, ARM::R5, ARM::R6, ARM::R7,
3168 ARM::R8, ARM::R9, ARM::R10, ARM::R11,
3169 ARM::R12, ARM::LR, 0);
Chris Lattnerc4e3f8e2007-04-02 17:24:08 +00003170 case 'w':
3171 if (VT == MVT::f32)
3172 return make_vector<unsigned>(ARM::S0, ARM::S1, ARM::S2, ARM::S3,
3173 ARM::S4, ARM::S5, ARM::S6, ARM::S7,
3174 ARM::S8, ARM::S9, ARM::S10, ARM::S11,
3175 ARM::S12,ARM::S13,ARM::S14,ARM::S15,
3176 ARM::S16,ARM::S17,ARM::S18,ARM::S19,
3177 ARM::S20,ARM::S21,ARM::S22,ARM::S23,
3178 ARM::S24,ARM::S25,ARM::S26,ARM::S27,
3179 ARM::S28,ARM::S29,ARM::S30,ARM::S31, 0);
3180 if (VT == MVT::f64)
3181 return make_vector<unsigned>(ARM::D0, ARM::D1, ARM::D2, ARM::D3,
3182 ARM::D4, ARM::D5, ARM::D6, ARM::D7,
3183 ARM::D8, ARM::D9, ARM::D10,ARM::D11,
3184 ARM::D12,ARM::D13,ARM::D14,ARM::D15, 0);
3185 break;
Evan Chenga8e29892007-01-19 07:51:42 +00003186 }
3187
3188 return std::vector<unsigned>();
3189}
Bob Wilsonbf6396b2009-04-01 17:58:54 +00003190
3191/// LowerAsmOperandForConstraint - Lower the specified operand into the Ops
3192/// vector. If it is invalid, don't add anything to Ops.
3193void ARMTargetLowering::LowerAsmOperandForConstraint(SDValue Op,
3194 char Constraint,
3195 bool hasMemory,
3196 std::vector<SDValue>&Ops,
3197 SelectionDAG &DAG) const {
3198 SDValue Result(0, 0);
3199
3200 switch (Constraint) {
3201 default: break;
3202 case 'I': case 'J': case 'K': case 'L':
3203 case 'M': case 'N': case 'O':
3204 ConstantSDNode *C = dyn_cast<ConstantSDNode>(Op);
3205 if (!C)
3206 return;
3207
3208 int64_t CVal64 = C->getSExtValue();
3209 int CVal = (int) CVal64;
3210 // None of these constraints allow values larger than 32 bits. Check
3211 // that the value fits in an int.
3212 if (CVal != CVal64)
3213 return;
3214
3215 switch (Constraint) {
3216 case 'I':
3217 if (Subtarget->isThumb()) {
3218 // This must be a constant between 0 and 255, for ADD immediates.
3219 if (CVal >= 0 && CVal <= 255)
3220 break;
3221 } else {
3222 // A constant that can be used as an immediate value in a
3223 // data-processing instruction.
3224 if (ARM_AM::getSOImmVal(CVal) != -1)
3225 break;
3226 }
3227 return;
3228
3229 case 'J':
3230 if (Subtarget->isThumb()) {
3231 // This must be a constant between -255 and -1, for negated ADD
3232 // immediates. This can be used in GCC with an "n" modifier that
3233 // prints the negated value, for use with SUB instructions. It is
3234 // not useful otherwise but is implemented for compatibility.
3235 if (CVal >= -255 && CVal <= -1)
3236 break;
3237 } else {
3238 // This must be a constant between -4095 and 4095. It is not clear
3239 // what this constraint is intended for. Implemented for
3240 // compatibility with GCC.
3241 if (CVal >= -4095 && CVal <= 4095)
3242 break;
3243 }
3244 return;
3245
3246 case 'K':
3247 if (Subtarget->isThumb()) {
3248 // A 32-bit value where only one byte has a nonzero value. Exclude
3249 // zero to match GCC. This constraint is used by GCC internally for
3250 // constants that can be loaded with a move/shift combination.
3251 // It is not useful otherwise but is implemented for compatibility.
3252 if (CVal != 0 && ARM_AM::isThumbImmShiftedVal(CVal))
3253 break;
3254 } else {
3255 // A constant whose bitwise inverse can be used as an immediate
3256 // value in a data-processing instruction. This can be used in GCC
3257 // with a "B" modifier that prints the inverted value, for use with
3258 // BIC and MVN instructions. It is not useful otherwise but is
3259 // implemented for compatibility.
3260 if (ARM_AM::getSOImmVal(~CVal) != -1)
3261 break;
3262 }
3263 return;
3264
3265 case 'L':
3266 if (Subtarget->isThumb()) {
3267 // This must be a constant between -7 and 7,
3268 // for 3-operand ADD/SUB immediate instructions.
3269 if (CVal >= -7 && CVal < 7)
3270 break;
3271 } else {
3272 // A constant whose negation can be used as an immediate value in a
3273 // data-processing instruction. This can be used in GCC with an "n"
3274 // modifier that prints the negated value, for use with SUB
3275 // instructions. It is not useful otherwise but is implemented for
3276 // compatibility.
3277 if (ARM_AM::getSOImmVal(-CVal) != -1)
3278 break;
3279 }
3280 return;
3281
3282 case 'M':
3283 if (Subtarget->isThumb()) {
3284 // This must be a multiple of 4 between 0 and 1020, for
3285 // ADD sp + immediate.
3286 if ((CVal >= 0 && CVal <= 1020) && ((CVal & 3) == 0))
3287 break;
3288 } else {
3289 // A power of two or a constant between 0 and 32. This is used in
3290 // GCC for the shift amount on shifted register operands, but it is
3291 // useful in general for any shift amounts.
3292 if ((CVal >= 0 && CVal <= 32) || ((CVal & (CVal - 1)) == 0))
3293 break;
3294 }
3295 return;
3296
3297 case 'N':
3298 if (Subtarget->isThumb()) {
3299 // This must be a constant between 0 and 31, for shift amounts.
3300 if (CVal >= 0 && CVal <= 31)
3301 break;
3302 }
3303 return;
3304
3305 case 'O':
3306 if (Subtarget->isThumb()) {
3307 // This must be a multiple of 4 between -508 and 508, for
3308 // ADD/SUB sp = sp + immediate.
3309 if ((CVal >= -508 && CVal <= 508) && ((CVal & 3) == 0))
3310 break;
3311 }
3312 return;
3313 }
3314 Result = DAG.getTargetConstant(CVal, Op.getValueType());
3315 break;
3316 }
3317
3318 if (Result.getNode()) {
3319 Ops.push_back(Result);
3320 return;
3321 }
3322 return TargetLowering::LowerAsmOperandForConstraint(Op, Constraint, hasMemory,
3323 Ops, DAG);
3324}