Blame - lib/Target/PowerPC/PPCISelLowering.cpp - fp2-dev/platform/external/llvm

blob: c6885cf7b8a4b54cef863d6e79e4f9ee7dafe315 [file] [log] [blame]

Dan Gohman	f17a25c	2007-07-18 16:29:46 +0000	[diff] [blame]	1	//===-- PPCISelLowering.cpp - PPC DAG Lowering Implementation -------------===//
				2	//
				3	// The LLVM Compiler Infrastructure
				4	//
Chris Lattner	081ce94	2007-12-29 20:36:04 +0000	[diff] [blame]	5	// This file is distributed under the University of Illinois Open Source
				6	// License. See LICENSE.TXT for details.
Dan Gohman	f17a25c	2007-07-18 16:29:46 +0000	[diff] [blame]	7	//
				8	//===----------------------------------------------------------------------===//
				9	//
				10	// This file implements the PPCISelLowering class.
				11	//
				12	//===----------------------------------------------------------------------===//
				13
				14	#include "PPCISelLowering.h"
				15	#include "PPCMachineFunctionInfo.h"
				16	#include "PPCPredicates.h"
				17	#include "PPCTargetMachine.h"
				18	#include "PPCPerfectShuffle.h"
Owen Anderson	1636de9	2007-09-07 04:06:50 +0000	[diff] [blame]	19	#include "llvm/ADT/STLExtras.h"
Dan Gohman	f17a25c	2007-07-18 16:29:46 +0000	[diff] [blame]	20	#include "llvm/ADT/VectorExtras.h"
				21	#include "llvm/Analysis/ScalarEvolutionExpressions.h"
				22	#include "llvm/CodeGen/CallingConvLower.h"
				23	#include "llvm/CodeGen/MachineFrameInfo.h"
				24	#include "llvm/CodeGen/MachineFunction.h"
				25	#include "llvm/CodeGen/MachineInstrBuilder.h"
Chris Lattner	1b98919	2007-12-31 04:13:23 +0000	[diff] [blame]	26	#include "llvm/CodeGen/MachineRegisterInfo.h"
Dan Gohman	12a9c08	2008-02-06 22:27:42 +0000	[diff] [blame]	27	#include "llvm/CodeGen/PseudoSourceValue.h"
Dan Gohman	f17a25c	2007-07-18 16:29:46 +0000	[diff] [blame]	28	#include "llvm/CodeGen/SelectionDAG.h"
Dan Gohman	f17a25c	2007-07-18 16:29:46 +0000	[diff] [blame]	29	#include "llvm/Constants.h"
				30	#include "llvm/Function.h"
				31	#include "llvm/Intrinsics.h"
				32	#include "llvm/Support/MathExtras.h"
				33	#include "llvm/Target/TargetOptions.h"
				34	#include "llvm/Support/CommandLine.h"
				35	using namespace llvm;
				36
				37	static cl::opt<bool> EnablePPCPreinc("enable-ppc-preinc",
				38	cl::desc("enable preincrement load/store generation on PPC (experimental)"),
				39	cl::Hidden);
				40
				41	PPCTargetLowering::PPCTargetLowering(PPCTargetMachine &TM)
				42	: TargetLowering(TM), PPCSubTarget(*TM.getSubtargetImpl()) {
				43
				44	setPow2DivIsCheap();
				45
				46	// Use _setjmp/_longjmp instead of setjmp/longjmp.
				47	setUseUnderscoreSetJmp(true);
				48	setUseUnderscoreLongJmp(true);
				49
				50	// Set up the register classes.
				51	addRegisterClass(MVT::i32, PPC::GPRCRegisterClass);
				52	addRegisterClass(MVT::f32, PPC::F4RCRegisterClass);
				53	addRegisterClass(MVT::f64, PPC::F8RCRegisterClass);
				54
				55	// PowerPC has an i16 but no i8 (or i1) SEXTLOAD
Duncan Sands	082524c	2008-01-23 20:39:46 +0000	[diff] [blame]	56	setLoadXAction(ISD::SEXTLOAD, MVT::i1, Promote);
Dan Gohman	f17a25c	2007-07-18 16:29:46 +0000	[diff] [blame]	57	setLoadXAction(ISD::SEXTLOAD, MVT::i8, Expand);
Duncan Sands	082524c	2008-01-23 20:39:46 +0000	[diff] [blame]	58
Chris Lattner	3bc0850	2008-01-17 19:59:44 +0000	[diff] [blame]	59	setTruncStoreAction(MVT::f64, MVT::f32, Expand);
				60
Dan Gohman	f17a25c	2007-07-18 16:29:46 +0000	[diff] [blame]	61	// PowerPC has pre-inc load and store's.
				62	setIndexedLoadAction(ISD::PRE_INC, MVT::i1, Legal);
				63	setIndexedLoadAction(ISD::PRE_INC, MVT::i8, Legal);
				64	setIndexedLoadAction(ISD::PRE_INC, MVT::i16, Legal);
				65	setIndexedLoadAction(ISD::PRE_INC, MVT::i32, Legal);
				66	setIndexedLoadAction(ISD::PRE_INC, MVT::i64, Legal);
				67	setIndexedStoreAction(ISD::PRE_INC, MVT::i1, Legal);
				68	setIndexedStoreAction(ISD::PRE_INC, MVT::i8, Legal);
				69	setIndexedStoreAction(ISD::PRE_INC, MVT::i16, Legal);
				70	setIndexedStoreAction(ISD::PRE_INC, MVT::i32, Legal);
				71	setIndexedStoreAction(ISD::PRE_INC, MVT::i64, Legal);
				72
Dale Johannesen	472d15d	2007-10-06 01:24:11 +0000	[diff] [blame]	73	// Shortening conversions involving ppcf128 get expanded (2 regs -> 1 reg)
				74	setConvertAction(MVT::ppcf128, MVT::f64, Expand);
				75	setConvertAction(MVT::ppcf128, MVT::f32, Expand);
Dale Johannesen	3d8578b	2007-10-10 01:01:31 +0000	[diff] [blame]	76	// This is used in the ppcf128->int sequence. Note it has different semantics
				77	// from FP_ROUND: that rounds to nearest, this rounds to zero.
				78	setOperationAction(ISD::FP_ROUND_INREG, MVT::ppcf128, Custom);
Dale Johannesen	472d15d	2007-10-06 01:24:11 +0000	[diff] [blame]	79
Dan Gohman	f17a25c	2007-07-18 16:29:46 +0000	[diff] [blame]	80	// PowerPC has no intrinsics for these particular operations
				81	setOperationAction(ISD::MEMMOVE, MVT::Other, Expand);
				82	setOperationAction(ISD::MEMSET, MVT::Other, Expand);
				83	setOperationAction(ISD::MEMCPY, MVT::Other, Expand);
Andrew Lenharth	0531ec5	2008-02-16 14:46:26 +0000	[diff] [blame]	84	setOperationAction(ISD::MEMBARRIER, MVT::Other, Expand);
				85
Dan Gohman	f17a25c	2007-07-18 16:29:46 +0000	[diff] [blame]	86	// PowerPC has no SREM/UREM instructions
				87	setOperationAction(ISD::SREM, MVT::i32, Expand);
				88	setOperationAction(ISD::UREM, MVT::i32, Expand);
				89	setOperationAction(ISD::SREM, MVT::i64, Expand);
				90	setOperationAction(ISD::UREM, MVT::i64, Expand);
Dan Gohman	c9130bb	2007-10-08 17:28:24 +0000	[diff] [blame]	91
				92	// Don't use SMUL_LOHI/UMUL_LOHI or SDIVREM/UDIVREM to lower SREM/UREM.
				93	setOperationAction(ISD::UMUL_LOHI, MVT::i32, Expand);
				94	setOperationAction(ISD::SMUL_LOHI, MVT::i32, Expand);
				95	setOperationAction(ISD::UMUL_LOHI, MVT::i64, Expand);
				96	setOperationAction(ISD::SMUL_LOHI, MVT::i64, Expand);
				97	setOperationAction(ISD::UDIVREM, MVT::i32, Expand);
				98	setOperationAction(ISD::SDIVREM, MVT::i32, Expand);
				99	setOperationAction(ISD::UDIVREM, MVT::i64, Expand);
				100	setOperationAction(ISD::SDIVREM, MVT::i64, Expand);
Dan Gohman	f17a25c	2007-07-18 16:29:46 +0000	[diff] [blame]	101
Dan Gohman	2f7b198	2007-10-11 23:21:31 +0000	[diff] [blame]	102	// We don't support sin/cos/sqrt/fmod/pow
Dan Gohman	f17a25c	2007-07-18 16:29:46 +0000	[diff] [blame]	103	setOperationAction(ISD::FSIN , MVT::f64, Expand);
				104	setOperationAction(ISD::FCOS , MVT::f64, Expand);
				105	setOperationAction(ISD::FREM , MVT::f64, Expand);
Dan Gohman	2f7b198	2007-10-11 23:21:31 +0000	[diff] [blame]	106	setOperationAction(ISD::FPOW , MVT::f64, Expand);
Dan Gohman	f17a25c	2007-07-18 16:29:46 +0000	[diff] [blame]	107	setOperationAction(ISD::FSIN , MVT::f32, Expand);
				108	setOperationAction(ISD::FCOS , MVT::f32, Expand);
				109	setOperationAction(ISD::FREM , MVT::f32, Expand);
Dan Gohman	2f7b198	2007-10-11 23:21:31 +0000	[diff] [blame]	110	setOperationAction(ISD::FPOW , MVT::f32, Expand);
Dale Johannesen	436e380	2008-01-18 19:55:37 +0000	[diff] [blame]	111
Dan Gohman	819574c	2008-01-31 00:41:03 +0000	[diff] [blame]	112	setOperationAction(ISD::FLT_ROUNDS_, MVT::i32, Custom);
Dan Gohman	f17a25c	2007-07-18 16:29:46 +0000	[diff] [blame]	113
				114	// If we're enabling GP optimizations, use hardware square root
				115	if (!TM.getSubtarget<PPCSubtarget>().hasFSQRT()) {
				116	setOperationAction(ISD::FSQRT, MVT::f64, Expand);
				117	setOperationAction(ISD::FSQRT, MVT::f32, Expand);
				118	}
				119
				120	setOperationAction(ISD::FCOPYSIGN, MVT::f64, Expand);
				121	setOperationAction(ISD::FCOPYSIGN, MVT::f32, Expand);
				122
				123	// PowerPC does not have BSWAP, CTPOP or CTTZ
				124	setOperationAction(ISD::BSWAP, MVT::i32 , Expand);
				125	setOperationAction(ISD::CTPOP, MVT::i32 , Expand);
				126	setOperationAction(ISD::CTTZ , MVT::i32 , Expand);
				127	setOperationAction(ISD::BSWAP, MVT::i64 , Expand);
				128	setOperationAction(ISD::CTPOP, MVT::i64 , Expand);
				129	setOperationAction(ISD::CTTZ , MVT::i64 , Expand);
				130
				131	// PowerPC does not have ROTR
				132	setOperationAction(ISD::ROTR, MVT::i32 , Expand);
				133
				134	// PowerPC does not have Select
				135	setOperationAction(ISD::SELECT, MVT::i32, Expand);
				136	setOperationAction(ISD::SELECT, MVT::i64, Expand);
				137	setOperationAction(ISD::SELECT, MVT::f32, Expand);
				138	setOperationAction(ISD::SELECT, MVT::f64, Expand);
				139
				140	// PowerPC wants to turn select_cc of FP into fsel when possible.
				141	setOperationAction(ISD::SELECT_CC, MVT::f32, Custom);
				142	setOperationAction(ISD::SELECT_CC, MVT::f64, Custom);
				143
				144	// PowerPC wants to optimize integer setcc a bit
				145	setOperationAction(ISD::SETCC, MVT::i32, Custom);
				146
				147	// PowerPC does not have BRCOND which requires SetCC
				148	setOperationAction(ISD::BRCOND, MVT::Other, Expand);
				149
				150	setOperationAction(ISD::BR_JT, MVT::Other, Expand);
				151
				152	// PowerPC turns FP_TO_SINT into FCTIWZ and some load/stores.
				153	setOperationAction(ISD::FP_TO_SINT, MVT::i32, Custom);
				154
				155	// PowerPC does not have [U\|S]INT_TO_FP
				156	setOperationAction(ISD::SINT_TO_FP, MVT::i32, Expand);
				157	setOperationAction(ISD::UINT_TO_FP, MVT::i32, Expand);
				158
				159	setOperationAction(ISD::BIT_CONVERT, MVT::f32, Expand);
				160	setOperationAction(ISD::BIT_CONVERT, MVT::i32, Expand);
				161	setOperationAction(ISD::BIT_CONVERT, MVT::i64, Expand);
				162	setOperationAction(ISD::BIT_CONVERT, MVT::f64, Expand);
				163
				164	// We cannot sextinreg(i1). Expand to shifts.
				165	setOperationAction(ISD::SIGN_EXTEND_INREG, MVT::i1, Expand);
				166
				167	// Support label based line numbers.
				168	setOperationAction(ISD::LOCATION, MVT::Other, Expand);
				169	setOperationAction(ISD::DEBUG_LOC, MVT::Other, Expand);
Nicolas Geoffray	6186476	2007-12-21 12:19:44 +0000	[diff] [blame]	170
				171	setOperationAction(ISD::EXCEPTIONADDR, MVT::i64, Expand);
				172	setOperationAction(ISD::EHSELECTION, MVT::i64, Expand);
				173	setOperationAction(ISD::EXCEPTIONADDR, MVT::i32, Expand);
				174	setOperationAction(ISD::EHSELECTION, MVT::i32, Expand);
				175
Dan Gohman	f17a25c	2007-07-18 16:29:46 +0000	[diff] [blame]	176
				177	// We want to legalize GlobalAddress and ConstantPool nodes into the
				178	// appropriate instructions to materialize the address.
				179	setOperationAction(ISD::GlobalAddress, MVT::i32, Custom);
				180	setOperationAction(ISD::GlobalTLSAddress, MVT::i32, Custom);
				181	setOperationAction(ISD::ConstantPool, MVT::i32, Custom);
				182	setOperationAction(ISD::JumpTable, MVT::i32, Custom);
				183	setOperationAction(ISD::GlobalAddress, MVT::i64, Custom);
				184	setOperationAction(ISD::GlobalTLSAddress, MVT::i64, Custom);
				185	setOperationAction(ISD::ConstantPool, MVT::i64, Custom);
				186	setOperationAction(ISD::JumpTable, MVT::i64, Custom);
				187
				188	// RET must be custom lowered, to meet ABI requirements
				189	setOperationAction(ISD::RET , MVT::Other, Custom);
Duncan Sands	38947cd	2007-07-27 12:58:54 +0000	[diff] [blame]	190
Dan Gohman	f17a25c	2007-07-18 16:29:46 +0000	[diff] [blame]	191	// VASTART needs to be custom lowered to use the VarArgsFrameIndex
				192	setOperationAction(ISD::VASTART , MVT::Other, Custom);
				193
				194	// VAARG is custom lowered with ELF 32 ABI
				195	if (TM.getSubtarget<PPCSubtarget>().isELF32_ABI())
				196	setOperationAction(ISD::VAARG, MVT::Other, Custom);
				197	else
				198	setOperationAction(ISD::VAARG, MVT::Other, Expand);
				199
				200	// Use the default implementation.
				201	setOperationAction(ISD::VACOPY , MVT::Other, Expand);
				202	setOperationAction(ISD::VAEND , MVT::Other, Expand);
				203	setOperationAction(ISD::STACKSAVE , MVT::Other, Expand);
				204	setOperationAction(ISD::STACKRESTORE , MVT::Other, Custom);
				205	setOperationAction(ISD::DYNAMIC_STACKALLOC, MVT::i32 , Custom);
				206	setOperationAction(ISD::DYNAMIC_STACKALLOC, MVT::i64 , Custom);
				207
				208	// We want to custom lower some of our intrinsics.
				209	setOperationAction(ISD::INTRINSIC_WO_CHAIN, MVT::Other, Custom);
				210
				211	if (TM.getSubtarget<PPCSubtarget>().has64BitSupport()) {
				212	// They also have instructions for converting between i64 and fp.
				213	setOperationAction(ISD::FP_TO_SINT, MVT::i64, Custom);
				214	setOperationAction(ISD::FP_TO_UINT, MVT::i64, Expand);
				215	setOperationAction(ISD::SINT_TO_FP, MVT::i64, Custom);
				216	setOperationAction(ISD::UINT_TO_FP, MVT::i64, Expand);
				217	setOperationAction(ISD::FP_TO_UINT, MVT::i32, Expand);
				218
				219	// FIXME: disable this lowered code. This generates 64-bit register values,
				220	// and we don't model the fact that the top part is clobbered by calls. We
				221	// need to flag these together so that the value isn't live across a call.
				222	//setOperationAction(ISD::SINT_TO_FP, MVT::i32, Custom);
				223
				224	// To take advantage of the above i64 FP_TO_SINT, promote i32 FP_TO_UINT
				225	setOperationAction(ISD::FP_TO_UINT, MVT::i32, Promote);
				226	} else {
				227	// PowerPC does not have FP_TO_UINT on 32-bit implementations.
				228	setOperationAction(ISD::FP_TO_UINT, MVT::i32, Expand);
				229	}
				230
				231	if (TM.getSubtarget<PPCSubtarget>().use64BitRegs()) {
Chris Lattner	c882caf	2007-10-19 04:08:28 +0000	[diff] [blame]	232	// 64-bit PowerPC implementations can support i64 types directly
Dan Gohman	f17a25c	2007-07-18 16:29:46 +0000	[diff] [blame]	233	addRegisterClass(MVT::i64, PPC::G8RCRegisterClass);
				234	// BUILD_PAIR can't be handled natively, and should be expanded to shl/or
				235	setOperationAction(ISD::BUILD_PAIR, MVT::i64, Expand);
Dan Gohman	71619ec	2008-03-07 20:36:53 +0000	[diff] [blame]	236	// 64-bit PowerPC wants to expand i128 shifts itself.
				237	setOperationAction(ISD::SHL_PARTS, MVT::i64, Custom);
				238	setOperationAction(ISD::SRA_PARTS, MVT::i64, Custom);
				239	setOperationAction(ISD::SRL_PARTS, MVT::i64, Custom);
Dan Gohman	f17a25c	2007-07-18 16:29:46 +0000	[diff] [blame]	240	} else {
Chris Lattner	c882caf	2007-10-19 04:08:28 +0000	[diff] [blame]	241	// 32-bit PowerPC wants to expand i64 shifts itself.
Dan Gohman	f17a25c	2007-07-18 16:29:46 +0000	[diff] [blame]	242	setOperationAction(ISD::SHL_PARTS, MVT::i32, Custom);
				243	setOperationAction(ISD::SRA_PARTS, MVT::i32, Custom);
				244	setOperationAction(ISD::SRL_PARTS, MVT::i32, Custom);
				245	}
				246
				247	if (TM.getSubtarget<PPCSubtarget>().hasAltivec()) {
				248	// First set operation action for all vector types to expand. Then we
				249	// will selectively turn on ones that can be effectively codegen'd.
				250	for (unsigned VT = (unsigned)MVT::FIRST_VECTOR_VALUETYPE;
				251	VT <= (unsigned)MVT::LAST_VECTOR_VALUETYPE; ++VT) {
				252	// add/sub are legal for all supported vector VT's.
				253	setOperationAction(ISD::ADD , (MVT::ValueType)VT, Legal);
				254	setOperationAction(ISD::SUB , (MVT::ValueType)VT, Legal);
				255
				256	// We promote all shuffles to v16i8.
				257	setOperationAction(ISD::VECTOR_SHUFFLE, (MVT::ValueType)VT, Promote);
				258	AddPromotedToType (ISD::VECTOR_SHUFFLE, (MVT::ValueType)VT, MVT::v16i8);
				259
				260	// We promote all non-typed operations to v4i32.
				261	setOperationAction(ISD::AND , (MVT::ValueType)VT, Promote);
				262	AddPromotedToType (ISD::AND , (MVT::ValueType)VT, MVT::v4i32);
				263	setOperationAction(ISD::OR , (MVT::ValueType)VT, Promote);
				264	AddPromotedToType (ISD::OR , (MVT::ValueType)VT, MVT::v4i32);
				265	setOperationAction(ISD::XOR , (MVT::ValueType)VT, Promote);
				266	AddPromotedToType (ISD::XOR , (MVT::ValueType)VT, MVT::v4i32);
				267	setOperationAction(ISD::LOAD , (MVT::ValueType)VT, Promote);
				268	AddPromotedToType (ISD::LOAD , (MVT::ValueType)VT, MVT::v4i32);
				269	setOperationAction(ISD::SELECT, (MVT::ValueType)VT, Promote);
				270	AddPromotedToType (ISD::SELECT, (MVT::ValueType)VT, MVT::v4i32);
				271	setOperationAction(ISD::STORE, (MVT::ValueType)VT, Promote);
				272	AddPromotedToType (ISD::STORE, (MVT::ValueType)VT, MVT::v4i32);
				273
				274	// No other operations are legal.
				275	setOperationAction(ISD::MUL , (MVT::ValueType)VT, Expand);
				276	setOperationAction(ISD::SDIV, (MVT::ValueType)VT, Expand);
				277	setOperationAction(ISD::SREM, (MVT::ValueType)VT, Expand);
				278	setOperationAction(ISD::UDIV, (MVT::ValueType)VT, Expand);
				279	setOperationAction(ISD::UREM, (MVT::ValueType)VT, Expand);
				280	setOperationAction(ISD::FDIV, (MVT::ValueType)VT, Expand);
Evan Cheng	c5912e3	2007-07-30 07:51:22 +0000	[diff] [blame]	281	setOperationAction(ISD::FNEG, (MVT::ValueType)VT, Expand);
Dan Gohman	f17a25c	2007-07-18 16:29:46 +0000	[diff] [blame]	282	setOperationAction(ISD::EXTRACT_VECTOR_ELT, (MVT::ValueType)VT, Expand);
				283	setOperationAction(ISD::INSERT_VECTOR_ELT, (MVT::ValueType)VT, Expand);
				284	setOperationAction(ISD::BUILD_VECTOR, (MVT::ValueType)VT, Expand);
Dan Gohman	c9130bb	2007-10-08 17:28:24 +0000	[diff] [blame]	285	setOperationAction(ISD::UMUL_LOHI, (MVT::ValueType)VT, Expand);
				286	setOperationAction(ISD::SMUL_LOHI, (MVT::ValueType)VT, Expand);
				287	setOperationAction(ISD::UDIVREM, (MVT::ValueType)VT, Expand);
				288	setOperationAction(ISD::SDIVREM, (MVT::ValueType)VT, Expand);
Dan Gohman	f17a25c	2007-07-18 16:29:46 +0000	[diff] [blame]	289	setOperationAction(ISD::SCALAR_TO_VECTOR, (MVT::ValueType)VT, Expand);
Dan Gohman	4e22ac4	2007-10-12 14:08:57 +0000	[diff] [blame]	290	setOperationAction(ISD::FPOW, (MVT::ValueType)VT, Expand);
				291	setOperationAction(ISD::CTPOP, (MVT::ValueType)VT, Expand);
				292	setOperationAction(ISD::CTLZ, (MVT::ValueType)VT, Expand);
				293	setOperationAction(ISD::CTTZ, (MVT::ValueType)VT, Expand);
Dan Gohman	f17a25c	2007-07-18 16:29:46 +0000	[diff] [blame]	294	}
				295
				296	// We can custom expand all VECTOR_SHUFFLEs to VPERM, others we can handle
				297	// with merges, splats, etc.
				298	setOperationAction(ISD::VECTOR_SHUFFLE, MVT::v16i8, Custom);
				299
				300	setOperationAction(ISD::AND , MVT::v4i32, Legal);
				301	setOperationAction(ISD::OR , MVT::v4i32, Legal);
				302	setOperationAction(ISD::XOR , MVT::v4i32, Legal);
				303	setOperationAction(ISD::LOAD , MVT::v4i32, Legal);
				304	setOperationAction(ISD::SELECT, MVT::v4i32, Expand);
				305	setOperationAction(ISD::STORE , MVT::v4i32, Legal);
				306
				307	addRegisterClass(MVT::v4f32, PPC::VRRCRegisterClass);
				308	addRegisterClass(MVT::v4i32, PPC::VRRCRegisterClass);
				309	addRegisterClass(MVT::v8i16, PPC::VRRCRegisterClass);
				310	addRegisterClass(MVT::v16i8, PPC::VRRCRegisterClass);
				311
				312	setOperationAction(ISD::MUL, MVT::v4f32, Legal);
				313	setOperationAction(ISD::MUL, MVT::v4i32, Custom);
				314	setOperationAction(ISD::MUL, MVT::v8i16, Custom);
				315	setOperationAction(ISD::MUL, MVT::v16i8, Custom);
				316
				317	setOperationAction(ISD::SCALAR_TO_VECTOR, MVT::v4f32, Custom);
				318	setOperationAction(ISD::SCALAR_TO_VECTOR, MVT::v4i32, Custom);
				319
				320	setOperationAction(ISD::BUILD_VECTOR, MVT::v16i8, Custom);
				321	setOperationAction(ISD::BUILD_VECTOR, MVT::v8i16, Custom);
				322	setOperationAction(ISD::BUILD_VECTOR, MVT::v4i32, Custom);
				323	setOperationAction(ISD::BUILD_VECTOR, MVT::v4f32, Custom);
				324	}
				325
Dan Gohman	f17a25c	2007-07-18 16:29:46 +0000	[diff] [blame]	326	setShiftAmountType(MVT::i32);
				327	setSetCCResultContents(ZeroOrOneSetCCResult);
				328
				329	if (TM.getSubtarget<PPCSubtarget>().isPPC64()) {
				330	setStackPointerRegisterToSaveRestore(PPC::X1);
				331	setExceptionPointerRegister(PPC::X3);
				332	setExceptionSelectorRegister(PPC::X4);
				333	} else {
				334	setStackPointerRegisterToSaveRestore(PPC::R1);
				335	setExceptionPointerRegister(PPC::R3);
				336	setExceptionSelectorRegister(PPC::R4);
				337	}
				338
				339	// We have target-specific dag combine patterns for the following nodes:
				340	setTargetDAGCombine(ISD::SINT_TO_FP);
				341	setTargetDAGCombine(ISD::STORE);
				342	setTargetDAGCombine(ISD::BR_CC);
				343	setTargetDAGCombine(ISD::BSWAP);
				344
Dale Johannesen	6f3c7bf	2007-10-19 00:59:18 +0000	[diff] [blame]	345	// Darwin long double math library functions have $LDBL128 appended.
				346	if (TM.getSubtarget<PPCSubtarget>().isDarwin()) {
Duncan Sands	37a3f47	2008-01-10 10:28:30 +0000	[diff] [blame]	347	setLibcallName(RTLIB::COS_PPCF128, "cosl$LDBL128");
Dale Johannesen	6f3c7bf	2007-10-19 00:59:18 +0000	[diff] [blame]	348	setLibcallName(RTLIB::POW_PPCF128, "powl$LDBL128");
				349	setLibcallName(RTLIB::REM_PPCF128, "fmodl$LDBL128");
Duncan Sands	37a3f47	2008-01-10 10:28:30 +0000	[diff] [blame]	350	setLibcallName(RTLIB::SIN_PPCF128, "sinl$LDBL128");
				351	setLibcallName(RTLIB::SQRT_PPCF128, "sqrtl$LDBL128");
Dale Johannesen	6f3c7bf	2007-10-19 00:59:18 +0000	[diff] [blame]	352	}
				353
Dan Gohman	f17a25c	2007-07-18 16:29:46 +0000	[diff] [blame]	354	computeRegisterProperties();
				355	}
				356
Dale Johannesen	88945f8	2008-02-28 22:31:51 +0000	[diff] [blame]	357	/// getByValTypeAlignment - Return the desired alignment for ByVal aggregate
				358	/// function arguments in the caller parameter area.
				359	unsigned PPCTargetLowering::getByValTypeAlignment(const Type *Ty) const {
				360	TargetMachine &TM = getTargetMachine();
				361	// Darwin passes everything on 4 byte boundary.
				362	if (TM.getSubtarget<PPCSubtarget>().isDarwin())
				363	return 4;
				364	// FIXME Elf TBD
				365	return 4;
				366	}
				367
Dan Gohman	f17a25c	2007-07-18 16:29:46 +0000	[diff] [blame]	368	const char *PPCTargetLowering::getTargetNodeName(unsigned Opcode) const {
				369	switch (Opcode) {
				370	default: return 0;
				371	case PPCISD::FSEL: return "PPCISD::FSEL";
				372	case PPCISD::FCFID: return "PPCISD::FCFID";
				373	case PPCISD::FCTIDZ: return "PPCISD::FCTIDZ";
				374	case PPCISD::FCTIWZ: return "PPCISD::FCTIWZ";
				375	case PPCISD::STFIWX: return "PPCISD::STFIWX";
				376	case PPCISD::VMADDFP: return "PPCISD::VMADDFP";
				377	case PPCISD::VNMSUBFP: return "PPCISD::VNMSUBFP";
				378	case PPCISD::VPERM: return "PPCISD::VPERM";
				379	case PPCISD::Hi: return "PPCISD::Hi";
				380	case PPCISD::Lo: return "PPCISD::Lo";
				381	case PPCISD::DYNALLOC: return "PPCISD::DYNALLOC";
				382	case PPCISD::GlobalBaseReg: return "PPCISD::GlobalBaseReg";
				383	case PPCISD::SRL: return "PPCISD::SRL";
				384	case PPCISD::SRA: return "PPCISD::SRA";
				385	case PPCISD::SHL: return "PPCISD::SHL";
				386	case PPCISD::EXTSW_32: return "PPCISD::EXTSW_32";
				387	case PPCISD::STD_32: return "PPCISD::STD_32";
				388	case PPCISD::CALL_ELF: return "PPCISD::CALL_ELF";
				389	case PPCISD::CALL_Macho: return "PPCISD::CALL_Macho";
				390	case PPCISD::MTCTR: return "PPCISD::MTCTR";
				391	case PPCISD::BCTRL_Macho: return "PPCISD::BCTRL_Macho";
				392	case PPCISD::BCTRL_ELF: return "PPCISD::BCTRL_ELF";
				393	case PPCISD::RET_FLAG: return "PPCISD::RET_FLAG";
				394	case PPCISD::MFCR: return "PPCISD::MFCR";
				395	case PPCISD::VCMP: return "PPCISD::VCMP";
				396	case PPCISD::VCMPo: return "PPCISD::VCMPo";
				397	case PPCISD::LBRX: return "PPCISD::LBRX";
				398	case PPCISD::STBRX: return "PPCISD::STBRX";
				399	case PPCISD::COND_BRANCH: return "PPCISD::COND_BRANCH";
Chris Lattner	e2a6e9f	2008-01-18 18:51:16 +0000	[diff] [blame]	400	case PPCISD::MFFS: return "PPCISD::MFFS";
				401	case PPCISD::MTFSB0: return "PPCISD::MTFSB0";
				402	case PPCISD::MTFSB1: return "PPCISD::MTFSB1";
				403	case PPCISD::FADDRTZ: return "PPCISD::FADDRTZ";
				404	case PPCISD::MTFSF: return "PPCISD::MTFSF";
Dan Gohman	f17a25c	2007-07-18 16:29:46 +0000	[diff] [blame]	405	}
				406	}
				407
Scott Michel	502151f	2008-03-10 15:42:14 +0000	[diff] [blame]	408
				409	MVT::ValueType
				410	PPCTargetLowering::getSetCCResultType(const SDOperand &) const {
				411	return MVT::i32;
				412	}
				413
				414
Dan Gohman	f17a25c	2007-07-18 16:29:46 +0000	[diff] [blame]	415	//===----------------------------------------------------------------------===//
				416	// Node matching predicates, for use by the tblgen matching code.
				417	//===----------------------------------------------------------------------===//
				418
				419	/// isFloatingPointZero - Return true if this is 0.0 or -0.0.
				420	static bool isFloatingPointZero(SDOperand Op) {
				421	if (ConstantFPSDNode *CFP = dyn_cast<ConstantFPSDNode>(Op))
Dale Johannesen	df8a831	2007-08-31 04:03:46 +0000	[diff] [blame]	422	return CFP->getValueAPF().isZero();
Dan Gohman	f17a25c	2007-07-18 16:29:46 +0000	[diff] [blame]	423	else if (ISD::isEXTLoad(Op.Val) \|\| ISD::isNON_EXTLoad(Op.Val)) {
				424	// Maybe this has already been legalized into the constant pool?
				425	if (ConstantPoolSDNode *CP = dyn_cast<ConstantPoolSDNode>(Op.getOperand(1)))
				426	if (ConstantFP *CFP = dyn_cast<ConstantFP>(CP->getConstVal()))
Dale Johannesen	df8a831	2007-08-31 04:03:46 +0000	[diff] [blame]	427	return CFP->getValueAPF().isZero();
Dan Gohman	f17a25c	2007-07-18 16:29:46 +0000	[diff] [blame]	428	}
				429	return false;
				430	}
				431
				432	/// isConstantOrUndef - Op is either an undef node or a ConstantSDNode. Return
				433	/// true if Op is undef or if it matches the specified value.
				434	static bool isConstantOrUndef(SDOperand Op, unsigned Val) {
				435	return Op.getOpcode() == ISD::UNDEF \|\|
				436	cast<ConstantSDNode>(Op)->getValue() == Val;
				437	}
				438
				439	/// isVPKUHUMShuffleMask - Return true if this is the shuffle mask for a
				440	/// VPKUHUM instruction.
				441	bool PPC::isVPKUHUMShuffleMask(SDNode *N, bool isUnary) {
				442	if (!isUnary) {
				443	for (unsigned i = 0; i != 16; ++i)
				444	if (!isConstantOrUndef(N->getOperand(i), i*2+1))
				445	return false;
				446	} else {
				447	for (unsigned i = 0; i != 8; ++i)
				448	if (!isConstantOrUndef(N->getOperand(i), i*2+1) \|\|
				449	!isConstantOrUndef(N->getOperand(i+8), i*2+1))
				450	return false;
				451	}
				452	return true;
				453	}
				454
				455	/// isVPKUWUMShuffleMask - Return true if this is the shuffle mask for a
				456	/// VPKUWUM instruction.
				457	bool PPC::isVPKUWUMShuffleMask(SDNode *N, bool isUnary) {
				458	if (!isUnary) {
				459	for (unsigned i = 0; i != 16; i += 2)
				460	if (!isConstantOrUndef(N->getOperand(i ), i*2+2) \|\|
				461	!isConstantOrUndef(N->getOperand(i+1), i*2+3))
				462	return false;
				463	} else {
				464	for (unsigned i = 0; i != 8; i += 2)
				465	if (!isConstantOrUndef(N->getOperand(i ), i*2+2) \|\|
				466	!isConstantOrUndef(N->getOperand(i+1), i*2+3) \|\|
				467	!isConstantOrUndef(N->getOperand(i+8), i*2+2) \|\|
				468	!isConstantOrUndef(N->getOperand(i+9), i*2+3))
				469	return false;
				470	}
				471	return true;
				472	}
				473
				474	/// isVMerge - Common function, used to match vmrg* shuffles.
				475	///
				476	static bool isVMerge(SDNode *N, unsigned UnitSize,
				477	unsigned LHSStart, unsigned RHSStart) {
				478	assert(N->getOpcode() == ISD::BUILD_VECTOR &&
				479	N->getNumOperands() == 16 && "PPC only supports shuffles by bytes!");
				480	assert((UnitSize == 1 \|\| UnitSize == 2 \|\| UnitSize == 4) &&
				481	"Unsupported merge size!");
				482
				483	for (unsigned i = 0; i != 8/UnitSize; ++i) // Step over units
				484	for (unsigned j = 0; j != UnitSize; ++j) { // Step over bytes within unit
				485	if (!isConstantOrUndef(N->getOperand(iUnitSize2+j),
				486	LHSStart+j+i*UnitSize) \|\|
				487	!isConstantOrUndef(N->getOperand(iUnitSize2+UnitSize+j),
				488	RHSStart+j+i*UnitSize))
				489	return false;
				490	}
				491	return true;
				492	}
				493
				494	/// isVMRGLShuffleMask - Return true if this is a shuffle mask suitable for
				495	/// a VRGL* instruction with the specified unit size (1,2 or 4 bytes).
				496	bool PPC::isVMRGLShuffleMask(SDNode *N, unsigned UnitSize, bool isUnary) {
				497	if (!isUnary)
				498	return isVMerge(N, UnitSize, 8, 24);
				499	return isVMerge(N, UnitSize, 8, 8);
				500	}
				501
				502	/// isVMRGHShuffleMask - Return true if this is a shuffle mask suitable for
				503	/// a VRGH* instruction with the specified unit size (1,2 or 4 bytes).
				504	bool PPC::isVMRGHShuffleMask(SDNode *N, unsigned UnitSize, bool isUnary) {
				505	if (!isUnary)
				506	return isVMerge(N, UnitSize, 0, 16);
				507	return isVMerge(N, UnitSize, 0, 0);
				508	}
				509
				510
				511	/// isVSLDOIShuffleMask - If this is a vsldoi shuffle mask, return the shift
				512	/// amount, otherwise return -1.
				513	int PPC::isVSLDOIShuffleMask(SDNode *N, bool isUnary) {
				514	assert(N->getOpcode() == ISD::BUILD_VECTOR &&
				515	N->getNumOperands() == 16 && "PPC only supports shuffles by bytes!");
				516	// Find the first non-undef value in the shuffle mask.
				517	unsigned i;
				518	for (i = 0; i != 16 && N->getOperand(i).getOpcode() == ISD::UNDEF; ++i)
				519	/search/;
				520
				521	if (i == 16) return -1; // all undef.
				522
				523	// Otherwise, check to see if the rest of the elements are consequtively
				524	// numbered from this value.
				525	unsigned ShiftAmt = cast<ConstantSDNode>(N->getOperand(i))->getValue();
				526	if (ShiftAmt < i) return -1;
				527	ShiftAmt -= i;
				528
				529	if (!isUnary) {
				530	// Check the rest of the elements to see if they are consequtive.
				531	for (++i; i != 16; ++i)
				532	if (!isConstantOrUndef(N->getOperand(i), ShiftAmt+i))
				533	return -1;
				534	} else {
				535	// Check the rest of the elements to see if they are consequtive.
				536	for (++i; i != 16; ++i)
				537	if (!isConstantOrUndef(N->getOperand(i), (ShiftAmt+i) & 15))
				538	return -1;
				539	}
				540
				541	return ShiftAmt;
				542	}
				543
				544	/// isSplatShuffleMask - Return true if the specified VECTOR_SHUFFLE operand
				545	/// specifies a splat of a single element that is suitable for input to
				546	/// VSPLTB/VSPLTH/VSPLTW.
				547	bool PPC::isSplatShuffleMask(SDNode *N, unsigned EltSize) {
				548	assert(N->getOpcode() == ISD::BUILD_VECTOR &&
				549	N->getNumOperands() == 16 &&
				550	(EltSize == 1 \|\| EltSize == 2 \|\| EltSize == 4));
				551
				552	// This is a splat operation if each element of the permute is the same, and
				553	// if the value doesn't reference the second vector.
				554	unsigned ElementBase = 0;
				555	SDOperand Elt = N->getOperand(0);
				556	if (ConstantSDNode *EltV = dyn_cast<ConstantSDNode>(Elt))
				557	ElementBase = EltV->getValue();
				558	else
				559	return false; // FIXME: Handle UNDEF elements too!
				560
				561	if (cast<ConstantSDNode>(Elt)->getValue() >= 16)
				562	return false;
				563
				564	// Check that they are consequtive.
				565	for (unsigned i = 1; i != EltSize; ++i) {
				566	if (!isa<ConstantSDNode>(N->getOperand(i)) \|\|
				567	cast<ConstantSDNode>(N->getOperand(i))->getValue() != i+ElementBase)
				568	return false;
				569	}
				570
				571	assert(isa<ConstantSDNode>(Elt) && "Invalid VECTOR_SHUFFLE mask!");
				572	for (unsigned i = EltSize, e = 16; i != e; i += EltSize) {
				573	if (N->getOperand(i).getOpcode() == ISD::UNDEF) continue;
				574	assert(isa<ConstantSDNode>(N->getOperand(i)) &&
				575	"Invalid VECTOR_SHUFFLE mask!");
				576	for (unsigned j = 0; j != EltSize; ++j)
				577	if (N->getOperand(i+j) != N->getOperand(j))
				578	return false;
				579	}
				580
				581	return true;
				582	}
				583
Evan Cheng	c5912e3	2007-07-30 07:51:22 +0000	[diff] [blame]	584	/// isAllNegativeZeroVector - Returns true if all elements of build_vector
				585	/// are -0.0.
				586	bool PPC::isAllNegativeZeroVector(SDNode *N) {
				587	assert(N->getOpcode() == ISD::BUILD_VECTOR);
				588	if (PPC::isSplatShuffleMask(N, N->getNumOperands()))
				589	if (ConstantFPSDNode *CFP = dyn_cast<ConstantFPSDNode>(N))
Dale Johannesen	df8a831	2007-08-31 04:03:46 +0000	[diff] [blame]	590	return CFP->getValueAPF().isNegZero();
Evan Cheng	c5912e3	2007-07-30 07:51:22 +0000	[diff] [blame]	591	return false;
				592	}
				593
Dan Gohman	f17a25c	2007-07-18 16:29:46 +0000	[diff] [blame]	594	/// getVSPLTImmediate - Return the appropriate VSPLT* immediate to splat the
				595	/// specified isSplatShuffleMask VECTOR_SHUFFLE mask.
				596	unsigned PPC::getVSPLTImmediate(SDNode *N, unsigned EltSize) {
				597	assert(isSplatShuffleMask(N, EltSize));
				598	return cast<ConstantSDNode>(N->getOperand(0))->getValue() / EltSize;
				599	}
				600
				601	/// get_VSPLTI_elt - If this is a build_vector of constants which can be formed
				602	/// by using a vspltis[bhw] instruction of the specified element size, return
				603	/// the constant being splatted. The ByteSize field indicates the number of
				604	/// bytes of each element [124] -> [bhw].
				605	SDOperand PPC::get_VSPLTI_elt(SDNode *N, unsigned ByteSize, SelectionDAG &DAG) {
				606	SDOperand OpVal(0, 0);
				607
				608	// If ByteSize of the splat is bigger than the element size of the
				609	// build_vector, then we have a case where we are checking for a splat where
				610	// multiple elements of the buildvector are folded together into a single
				611	// logical element of the splat (e.g. "vsplish 1" to splat {0,1}*8).
				612	unsigned EltSize = 16/N->getNumOperands();
				613	if (EltSize < ByteSize) {
				614	unsigned Multiple = ByteSize/EltSize; // Number of BV entries per spltval.
				615	SDOperand UniquedVals[4];
				616	assert(Multiple > 1 && Multiple <= 4 && "How can this happen?");
				617
				618	// See if all of the elements in the buildvector agree across.
				619	for (unsigned i = 0, e = N->getNumOperands(); i != e; ++i) {
				620	if (N->getOperand(i).getOpcode() == ISD::UNDEF) continue;
				621	// If the element isn't a constant, bail fully out.
				622	if (!isa<ConstantSDNode>(N->getOperand(i))) return SDOperand();
				623
				624
				625	if (UniquedVals[i&(Multiple-1)].Val == 0)
				626	UniquedVals[i&(Multiple-1)] = N->getOperand(i);
				627	else if (UniquedVals[i&(Multiple-1)] != N->getOperand(i))
				628	return SDOperand(); // no match.
				629	}
				630
				631	// Okay, if we reached this point, UniquedVals[0..Multiple-1] contains
				632	// either constant or undef values that are identical for each chunk. See
				633	// if these chunks can form into a larger vspltis*.
				634
				635	// Check to see if all of the leading entries are either 0 or -1. If
				636	// neither, then this won't fit into the immediate field.
				637	bool LeadingZero = true;
				638	bool LeadingOnes = true;
				639	for (unsigned i = 0; i != Multiple-1; ++i) {
				640	if (UniquedVals[i].Val == 0) continue; // Must have been undefs.
				641
				642	LeadingZero &= cast<ConstantSDNode>(UniquedVals[i])->isNullValue();
				643	LeadingOnes &= cast<ConstantSDNode>(UniquedVals[i])->isAllOnesValue();
				644	}
				645	// Finally, check the least significant entry.
				646	if (LeadingZero) {
				647	if (UniquedVals[Multiple-1].Val == 0)
				648	return DAG.getTargetConstant(0, MVT::i32); // 0,0,0,undef
				649	int Val = cast<ConstantSDNode>(UniquedVals[Multiple-1])->getValue();
				650	if (Val < 16)
				651	return DAG.getTargetConstant(Val, MVT::i32); // 0,0,0,4 -> vspltisw(4)
				652	}
				653	if (LeadingOnes) {
				654	if (UniquedVals[Multiple-1].Val == 0)
				655	return DAG.getTargetConstant(~0U, MVT::i32); // -1,-1,-1,undef
				656	int Val =cast<ConstantSDNode>(UniquedVals[Multiple-1])->getSignExtended();
				657	if (Val >= -16) // -1,-1,-1,-2 -> vspltisw(-2)
				658	return DAG.getTargetConstant(Val, MVT::i32);
				659	}
				660
				661	return SDOperand();
				662	}
				663
				664	// Check to see if this buildvec has a single non-undef value in its elements.
				665	for (unsigned i = 0, e = N->getNumOperands(); i != e; ++i) {
				666	if (N->getOperand(i).getOpcode() == ISD::UNDEF) continue;
				667	if (OpVal.Val == 0)
				668	OpVal = N->getOperand(i);
				669	else if (OpVal != N->getOperand(i))
				670	return SDOperand();
				671	}
				672
				673	if (OpVal.Val == 0) return SDOperand(); // All UNDEF: use implicit def.
				674
				675	unsigned ValSizeInBytes = 0;
				676	uint64_t Value = 0;
				677	if (ConstantSDNode *CN = dyn_cast<ConstantSDNode>(OpVal)) {
				678	Value = CN->getValue();
				679	ValSizeInBytes = MVT::getSizeInBits(CN->getValueType(0))/8;
				680	} else if (ConstantFPSDNode *CN = dyn_cast<ConstantFPSDNode>(OpVal)) {
				681	assert(CN->getValueType(0) == MVT::f32 && "Only one legal FP vector type!");
Dale Johannesen	df8a831	2007-08-31 04:03:46 +0000	[diff] [blame]	682	Value = FloatToBits(CN->getValueAPF().convertToFloat());
Dan Gohman	f17a25c	2007-07-18 16:29:46 +0000	[diff] [blame]	683	ValSizeInBytes = 4;
				684	}
				685
				686	// If the splat value is larger than the element value, then we can never do
				687	// this splat. The only case that we could fit the replicated bits into our
				688	// immediate field for would be zero, and we prefer to use vxor for it.
				689	if (ValSizeInBytes < ByteSize) return SDOperand();
				690
				691	// If the element value is larger than the splat value, cut it in half and
				692	// check to see if the two halves are equal. Continue doing this until we
				693	// get to ByteSize. This allows us to handle 0x01010101 as 0x01.
				694	while (ValSizeInBytes > ByteSize) {
				695	ValSizeInBytes >>= 1;
				696
				697	// If the top half equals the bottom half, we're still ok.
				698	if (((Value >> (ValSizeInBytes8)) & ((1 << (8ValSizeInBytes))-1)) !=
				699	(Value & ((1 << (8*ValSizeInBytes))-1)))
				700	return SDOperand();
				701	}
				702
				703	// Properly sign extend the value.
				704	int ShAmt = (4-ByteSize)*8;
				705	int MaskVal = ((int)Value << ShAmt) >> ShAmt;
				706
				707	// If this is zero, don't match, zero matches ISD::isBuildVectorAllZeros.
				708	if (MaskVal == 0) return SDOperand();
				709
				710	// Finally, if this value fits in a 5 bit sext field, return it
				711	if (((MaskVal << (32-5)) >> (32-5)) == MaskVal)
				712	return DAG.getTargetConstant(MaskVal, MVT::i32);
				713	return SDOperand();
				714	}
				715
				716	//===----------------------------------------------------------------------===//
				717	// Addressing Mode Selection
				718	//===----------------------------------------------------------------------===//
				719
				720	/// isIntS16Immediate - This method tests to see if the node is either a 32-bit
				721	/// or 64-bit immediate, and if the value can be accurately represented as a
				722	/// sign extension from a 16-bit value. If so, this returns true and the
				723	/// immediate.
				724	static bool isIntS16Immediate(SDNode *N, short &Imm) {
				725	if (N->getOpcode() != ISD::Constant)
				726	return false;
				727
				728	Imm = (short)cast<ConstantSDNode>(N)->getValue();
				729	if (N->getValueType(0) == MVT::i32)
				730	return Imm == (int32_t)cast<ConstantSDNode>(N)->getValue();
				731	else
				732	return Imm == (int64_t)cast<ConstantSDNode>(N)->getValue();
				733	}
				734	static bool isIntS16Immediate(SDOperand Op, short &Imm) {
				735	return isIntS16Immediate(Op.Val, Imm);
				736	}
				737
				738
				739	/// SelectAddressRegReg - Given the specified addressed, check to see if it
				740	/// can be represented as an indexed [r+r] operation. Returns false if it
				741	/// can be more efficiently represented with [r+imm].
				742	bool PPCTargetLowering::SelectAddressRegReg(SDOperand N, SDOperand &Base,
				743	SDOperand &Index,
				744	SelectionDAG &DAG) {
				745	short imm = 0;
				746	if (N.getOpcode() == ISD::ADD) {
				747	if (isIntS16Immediate(N.getOperand(1), imm))
				748	return false; // r+i
				749	if (N.getOperand(1).getOpcode() == PPCISD::Lo)
				750	return false; // r+i
				751
				752	Base = N.getOperand(0);
				753	Index = N.getOperand(1);
				754	return true;
				755	} else if (N.getOpcode() == ISD::OR) {
				756	if (isIntS16Immediate(N.getOperand(1), imm))
				757	return false; // r+i can fold it if we can.
				758
				759	// If this is an or of disjoint bitfields, we can codegen this as an add
				760	// (for better address arithmetic) if the LHS and RHS of the OR are provably
				761	// disjoint.
Dan Gohman	63f4e46	2008-02-27 01:23:58 +0000	[diff] [blame]	762	APInt LHSKnownZero, LHSKnownOne;
				763	APInt RHSKnownZero, RHSKnownOne;
				764	DAG.ComputeMaskedBits(N.getOperand(0),
Dan Gohman	c9cd46f	2008-02-27 21:12:32 +0000	[diff] [blame]	765	APInt::getAllOnesValue(N.getOperand(0)
				766	.getValueSizeInBits()),
Dan Gohman	63f4e46	2008-02-27 01:23:58 +0000	[diff] [blame]	767	LHSKnownZero, LHSKnownOne);
Dan Gohman	f17a25c	2007-07-18 16:29:46 +0000	[diff] [blame]	768
Dan Gohman	63f4e46	2008-02-27 01:23:58 +0000	[diff] [blame]	769	if (LHSKnownZero.getBoolValue()) {
				770	DAG.ComputeMaskedBits(N.getOperand(1),
Dan Gohman	c9cd46f	2008-02-27 21:12:32 +0000	[diff] [blame]	771	APInt::getAllOnesValue(N.getOperand(1)
				772	.getValueSizeInBits()),
Dan Gohman	63f4e46	2008-02-27 01:23:58 +0000	[diff] [blame]	773	RHSKnownZero, RHSKnownOne);
Dan Gohman	f17a25c	2007-07-18 16:29:46 +0000	[diff] [blame]	774	// If all of the bits are known zero on the LHS or RHS, the add won't
				775	// carry.
Dan Gohman	c9cd46f	2008-02-27 21:12:32 +0000	[diff] [blame]	776	if (~(LHSKnownZero \| RHSKnownZero) == 0) {
Dan Gohman	f17a25c	2007-07-18 16:29:46 +0000	[diff] [blame]	777	Base = N.getOperand(0);
				778	Index = N.getOperand(1);
				779	return true;
				780	}
				781	}
				782	}
				783
				784	return false;
				785	}
				786
				787	/// Returns true if the address N can be represented by a base register plus
				788	/// a signed 16-bit displacement [r+imm], and if it is not better
				789	/// represented as reg+reg.
				790	bool PPCTargetLowering::SelectAddressRegImm(SDOperand N, SDOperand &Disp,
				791	SDOperand &Base, SelectionDAG &DAG){
				792	// If this can be more profitably realized as r+r, fail.
				793	if (SelectAddressRegReg(N, Disp, Base, DAG))
				794	return false;
				795
				796	if (N.getOpcode() == ISD::ADD) {
				797	short imm = 0;
				798	if (isIntS16Immediate(N.getOperand(1), imm)) {
				799	Disp = DAG.getTargetConstant((int)imm & 0xFFFF, MVT::i32);
				800	if (FrameIndexSDNode *FI = dyn_cast<FrameIndexSDNode>(N.getOperand(0))) {
				801	Base = DAG.getTargetFrameIndex(FI->getIndex(), N.getValueType());
				802	} else {
				803	Base = N.getOperand(0);
				804	}
				805	return true; // [r+i]
				806	} else if (N.getOperand(1).getOpcode() == PPCISD::Lo) {
				807	// Match LOAD (ADD (X, Lo(G))).
				808	assert(!cast<ConstantSDNode>(N.getOperand(1).getOperand(1))->getValue()
				809	&& "Cannot handle constant offsets yet!");
				810	Disp = N.getOperand(1).getOperand(0); // The global address.
				811	assert(Disp.getOpcode() == ISD::TargetGlobalAddress \|\|
				812	Disp.getOpcode() == ISD::TargetConstantPool \|\|
				813	Disp.getOpcode() == ISD::TargetJumpTable);
				814	Base = N.getOperand(0);
				815	return true; // [&g+r]
				816	}
				817	} else if (N.getOpcode() == ISD::OR) {
				818	short imm = 0;
				819	if (isIntS16Immediate(N.getOperand(1), imm)) {
				820	// If this is an or of disjoint bitfields, we can codegen this as an add
				821	// (for better address arithmetic) if the LHS and RHS of the OR are
				822	// provably disjoint.
Dan Gohman	63f4e46	2008-02-27 01:23:58 +0000	[diff] [blame]	823	APInt LHSKnownZero, LHSKnownOne;
				824	DAG.ComputeMaskedBits(N.getOperand(0),
				825	APInt::getAllOnesValue(32),
				826	LHSKnownZero, LHSKnownOne);
				827	if ((LHSKnownZero.getZExtValue()\|~(uint64_t)imm) == ~0ULL) {
Dan Gohman	f17a25c	2007-07-18 16:29:46 +0000	[diff] [blame]	828	// If all of the bits are known zero on the LHS or RHS, the add won't
				829	// carry.
				830	Base = N.getOperand(0);
				831	Disp = DAG.getTargetConstant((int)imm & 0xFFFF, MVT::i32);
				832	return true;
				833	}
				834	}
				835	} else if (ConstantSDNode *CN = dyn_cast<ConstantSDNode>(N)) {
				836	// Loading from a constant address.
				837
				838	// If this address fits entirely in a 16-bit sext immediate field, codegen
				839	// this as "d, 0"
				840	short Imm;
				841	if (isIntS16Immediate(CN, Imm)) {
				842	Disp = DAG.getTargetConstant(Imm, CN->getValueType(0));
				843	Base = DAG.getRegister(PPC::R0, CN->getValueType(0));
				844	return true;
				845	}
				846
				847	// Handle 32-bit sext immediates with LIS + addr mode.
				848	if (CN->getValueType(0) == MVT::i32 \|\|
				849	(int64_t)CN->getValue() == (int)CN->getValue()) {
				850	int Addr = (int)CN->getValue();
				851
				852	// Otherwise, break this down into an LIS + disp.
				853	Disp = DAG.getTargetConstant((short)Addr, MVT::i32);
				854
				855	Base = DAG.getTargetConstant((Addr - (signed short)Addr) >> 16, MVT::i32);
				856	unsigned Opc = CN->getValueType(0) == MVT::i32 ? PPC::LIS : PPC::LIS8;
				857	Base = SDOperand(DAG.getTargetNode(Opc, CN->getValueType(0), Base), 0);
				858	return true;
				859	}
				860	}
				861
				862	Disp = DAG.getTargetConstant(0, getPointerTy());
				863	if (FrameIndexSDNode *FI = dyn_cast<FrameIndexSDNode>(N))
				864	Base = DAG.getTargetFrameIndex(FI->getIndex(), N.getValueType());
				865	else
				866	Base = N;
				867	return true; // [r+0]
				868	}
				869
				870	/// SelectAddressRegRegOnly - Given the specified addressed, force it to be
				871	/// represented as an indexed [r+r] operation.
				872	bool PPCTargetLowering::SelectAddressRegRegOnly(SDOperand N, SDOperand &Base,
				873	SDOperand &Index,
				874	SelectionDAG &DAG) {
				875	// Check to see if we can easily represent this as an [r+r] address. This
				876	// will fail if it thinks that the address is more profitably represented as
				877	// reg+imm, e.g. where imm = 0.
				878	if (SelectAddressRegReg(N, Base, Index, DAG))
				879	return true;
				880
				881	// If the operand is an addition, always emit this as [r+r], since this is
				882	// better (for code size, and execution, as the memop does the add for free)
				883	// than emitting an explicit add.
				884	if (N.getOpcode() == ISD::ADD) {
				885	Base = N.getOperand(0);
				886	Index = N.getOperand(1);
				887	return true;
				888	}
				889
				890	// Otherwise, do it the hard way, using R0 as the base register.
				891	Base = DAG.getRegister(PPC::R0, N.getValueType());
				892	Index = N;
				893	return true;
				894	}
				895
				896	/// SelectAddressRegImmShift - Returns true if the address N can be
				897	/// represented by a base register plus a signed 14-bit displacement
				898	/// [r+imm*4]. Suitable for use by STD and friends.
				899	bool PPCTargetLowering::SelectAddressRegImmShift(SDOperand N, SDOperand &Disp,
				900	SDOperand &Base,
				901	SelectionDAG &DAG) {
				902	// If this can be more profitably realized as r+r, fail.
				903	if (SelectAddressRegReg(N, Disp, Base, DAG))
				904	return false;
				905
				906	if (N.getOpcode() == ISD::ADD) {
				907	short imm = 0;
				908	if (isIntS16Immediate(N.getOperand(1), imm) && (imm & 3) == 0) {
				909	Disp = DAG.getTargetConstant(((int)imm & 0xFFFF) >> 2, MVT::i32);
				910	if (FrameIndexSDNode *FI = dyn_cast<FrameIndexSDNode>(N.getOperand(0))) {
				911	Base = DAG.getTargetFrameIndex(FI->getIndex(), N.getValueType());
				912	} else {
				913	Base = N.getOperand(0);
				914	}
				915	return true; // [r+i]
				916	} else if (N.getOperand(1).getOpcode() == PPCISD::Lo) {
				917	// Match LOAD (ADD (X, Lo(G))).
				918	assert(!cast<ConstantSDNode>(N.getOperand(1).getOperand(1))->getValue()
				919	&& "Cannot handle constant offsets yet!");
				920	Disp = N.getOperand(1).getOperand(0); // The global address.
				921	assert(Disp.getOpcode() == ISD::TargetGlobalAddress \|\|
				922	Disp.getOpcode() == ISD::TargetConstantPool \|\|
				923	Disp.getOpcode() == ISD::TargetJumpTable);
				924	Base = N.getOperand(0);
				925	return true; // [&g+r]
				926	}
				927	} else if (N.getOpcode() == ISD::OR) {
				928	short imm = 0;
				929	if (isIntS16Immediate(N.getOperand(1), imm) && (imm & 3) == 0) {
				930	// If this is an or of disjoint bitfields, we can codegen this as an add
				931	// (for better address arithmetic) if the LHS and RHS of the OR are
				932	// provably disjoint.
Dan Gohman	63f4e46	2008-02-27 01:23:58 +0000	[diff] [blame]	933	APInt LHSKnownZero, LHSKnownOne;
				934	DAG.ComputeMaskedBits(N.getOperand(0),
				935	APInt::getAllOnesValue(32),
				936	LHSKnownZero, LHSKnownOne);
				937	if ((LHSKnownZero.getZExtValue()\|~(uint64_t)imm) == ~0ULL) {
Dan Gohman	f17a25c	2007-07-18 16:29:46 +0000	[diff] [blame]	938	// If all of the bits are known zero on the LHS or RHS, the add won't
				939	// carry.
				940	Base = N.getOperand(0);
				941	Disp = DAG.getTargetConstant(((int)imm & 0xFFFF) >> 2, MVT::i32);
				942	return true;
				943	}
				944	}
				945	} else if (ConstantSDNode *CN = dyn_cast<ConstantSDNode>(N)) {
				946	// Loading from a constant address. Verify low two bits are clear.
				947	if ((CN->getValue() & 3) == 0) {
				948	// If this address fits entirely in a 14-bit sext immediate field, codegen
				949	// this as "d, 0"
				950	short Imm;
				951	if (isIntS16Immediate(CN, Imm)) {
				952	Disp = DAG.getTargetConstant((unsigned short)Imm >> 2, getPointerTy());
				953	Base = DAG.getRegister(PPC::R0, CN->getValueType(0));
				954	return true;
				955	}
				956
				957	// Fold the low-part of 32-bit absolute addresses into addr mode.
				958	if (CN->getValueType(0) == MVT::i32 \|\|
				959	(int64_t)CN->getValue() == (int)CN->getValue()) {
				960	int Addr = (int)CN->getValue();
				961
				962	// Otherwise, break this down into an LIS + disp.
				963	Disp = DAG.getTargetConstant((short)Addr >> 2, MVT::i32);
				964
				965	Base = DAG.getTargetConstant((Addr-(signed short)Addr) >> 16, MVT::i32);
				966	unsigned Opc = CN->getValueType(0) == MVT::i32 ? PPC::LIS : PPC::LIS8;
				967	Base = SDOperand(DAG.getTargetNode(Opc, CN->getValueType(0), Base), 0);
				968	return true;
				969	}
				970	}
				971	}
				972
				973	Disp = DAG.getTargetConstant(0, getPointerTy());
				974	if (FrameIndexSDNode *FI = dyn_cast<FrameIndexSDNode>(N))
				975	Base = DAG.getTargetFrameIndex(FI->getIndex(), N.getValueType());
				976	else
				977	Base = N;
				978	return true; // [r+0]
				979	}
				980
				981
				982	/// getPreIndexedAddressParts - returns true by value, base pointer and
				983	/// offset pointer and addressing mode by reference if the node's address
				984	/// can be legally represented as pre-indexed load / store address.
				985	bool PPCTargetLowering::getPreIndexedAddressParts(SDNode *N, SDOperand &Base,
				986	SDOperand &Offset,
				987	ISD::MemIndexedMode &AM,
				988	SelectionDAG &DAG) {
				989	// Disabled by default for now.
				990	if (!EnablePPCPreinc) return false;
				991
				992	SDOperand Ptr;
				993	MVT::ValueType VT;
				994	if (LoadSDNode *LD = dyn_cast<LoadSDNode>(N)) {
				995	Ptr = LD->getBasePtr();
Dan Gohman	9a4c92c	2008-01-30 00:15:11 +0000	[diff] [blame]	996	VT = LD->getMemoryVT();
Dan Gohman	f17a25c	2007-07-18 16:29:46 +0000	[diff] [blame]	997
				998	} else if (StoreSDNode *ST = dyn_cast<StoreSDNode>(N)) {
				999	ST = ST;
				1000	Ptr = ST->getBasePtr();
Dan Gohman	9a4c92c	2008-01-30 00:15:11 +0000	[diff] [blame]	1001	VT = ST->getMemoryVT();
Dan Gohman	f17a25c	2007-07-18 16:29:46 +0000	[diff] [blame]	1002	} else
				1003	return false;
				1004
				1005	// PowerPC doesn't have preinc load/store instructions for vectors.
				1006	if (MVT::isVector(VT))
				1007	return false;
				1008
				1009	// TODO: Check reg+reg first.
				1010
				1011	// LDU/STU use reg+imm*4, others use reg+imm.
				1012	if (VT != MVT::i64) {
				1013	// reg + imm
				1014	if (!SelectAddressRegImm(Ptr, Offset, Base, DAG))
				1015	return false;
				1016	} else {
				1017	// reg + imm * 4.
				1018	if (!SelectAddressRegImmShift(Ptr, Offset, Base, DAG))
				1019	return false;
				1020	}
				1021
				1022	if (LoadSDNode *LD = dyn_cast<LoadSDNode>(N)) {
				1023	// PPC64 doesn't have lwau, but it does have lwaux. Reject preinc load of
				1024	// sext i32 to i64 when addr mode is r+i.
Dan Gohman	9a4c92c	2008-01-30 00:15:11 +0000	[diff] [blame]	1025	if (LD->getValueType(0) == MVT::i64 && LD->getMemoryVT() == MVT::i32 &&
Dan Gohman	f17a25c	2007-07-18 16:29:46 +0000	[diff] [blame]	1026	LD->getExtensionType() == ISD::SEXTLOAD &&
				1027	isa<ConstantSDNode>(Offset))
				1028	return false;
				1029	}
				1030
				1031	AM = ISD::PRE_INC;
				1032	return true;
				1033	}
				1034
				1035	//===----------------------------------------------------------------------===//
				1036	// LowerOperation implementation
				1037	//===----------------------------------------------------------------------===//
				1038
Dale Johannesen	8be83a7	2008-03-04 23:17:14 +0000	[diff] [blame]	1039	SDOperand PPCTargetLowering::LowerConstantPool(SDOperand Op,
				1040	SelectionDAG &DAG) {
Dan Gohman	f17a25c	2007-07-18 16:29:46 +0000	[diff] [blame]	1041	MVT::ValueType PtrVT = Op.getValueType();
				1042	ConstantPoolSDNode *CP = cast<ConstantPoolSDNode>(Op);
				1043	Constant *C = CP->getConstVal();
				1044	SDOperand CPI = DAG.getTargetConstantPool(C, PtrVT, CP->getAlignment());
				1045	SDOperand Zero = DAG.getConstant(0, PtrVT);
				1046
				1047	const TargetMachine &TM = DAG.getTarget();
				1048
				1049	SDOperand Hi = DAG.getNode(PPCISD::Hi, PtrVT, CPI, Zero);
				1050	SDOperand Lo = DAG.getNode(PPCISD::Lo, PtrVT, CPI, Zero);
				1051
				1052	// If this is a non-darwin platform, we don't support non-static relo models
				1053	// yet.
				1054	if (TM.getRelocationModel() == Reloc::Static \|\|
				1055	!TM.getSubtarget<PPCSubtarget>().isDarwin()) {
				1056	// Generate non-pic code that has direct accesses to the constant pool.
				1057	// The address of the global is just (hi(&g)+lo(&g)).
				1058	return DAG.getNode(ISD::ADD, PtrVT, Hi, Lo);
				1059	}
				1060
				1061	if (TM.getRelocationModel() == Reloc::PIC_) {
				1062	// With PIC, the first instruction is actually "GR+hi(&G)".
				1063	Hi = DAG.getNode(ISD::ADD, PtrVT,
				1064	DAG.getNode(PPCISD::GlobalBaseReg, PtrVT), Hi);
				1065	}
				1066
				1067	Lo = DAG.getNode(ISD::ADD, PtrVT, Hi, Lo);
				1068	return Lo;
				1069	}
				1070
Dale Johannesen	8be83a7	2008-03-04 23:17:14 +0000	[diff] [blame]	1071	SDOperand PPCTargetLowering::LowerJumpTable(SDOperand Op, SelectionDAG &DAG) {
Dan Gohman	f17a25c	2007-07-18 16:29:46 +0000	[diff] [blame]	1072	MVT::ValueType PtrVT = Op.getValueType();
				1073	JumpTableSDNode *JT = cast<JumpTableSDNode>(Op);
				1074	SDOperand JTI = DAG.getTargetJumpTable(JT->getIndex(), PtrVT);
				1075	SDOperand Zero = DAG.getConstant(0, PtrVT);
				1076
				1077	const TargetMachine &TM = DAG.getTarget();
				1078
				1079	SDOperand Hi = DAG.getNode(PPCISD::Hi, PtrVT, JTI, Zero);
				1080	SDOperand Lo = DAG.getNode(PPCISD::Lo, PtrVT, JTI, Zero);
				1081
				1082	// If this is a non-darwin platform, we don't support non-static relo models
				1083	// yet.
				1084	if (TM.getRelocationModel() == Reloc::Static \|\|
				1085	!TM.getSubtarget<PPCSubtarget>().isDarwin()) {
				1086	// Generate non-pic code that has direct accesses to the constant pool.
				1087	// The address of the global is just (hi(&g)+lo(&g)).
				1088	return DAG.getNode(ISD::ADD, PtrVT, Hi, Lo);
				1089	}
				1090
				1091	if (TM.getRelocationModel() == Reloc::PIC_) {
				1092	// With PIC, the first instruction is actually "GR+hi(&G)".
				1093	Hi = DAG.getNode(ISD::ADD, PtrVT,
				1094	DAG.getNode(PPCISD::GlobalBaseReg, PtrVT), Hi);
				1095	}
				1096
				1097	Lo = DAG.getNode(ISD::ADD, PtrVT, Hi, Lo);
				1098	return Lo;
				1099	}
				1100
Dale Johannesen	8be83a7	2008-03-04 23:17:14 +0000	[diff] [blame]	1101	SDOperand PPCTargetLowering::LowerGlobalTLSAddress(SDOperand Op,
				1102	SelectionDAG &DAG) {
Dan Gohman	f17a25c	2007-07-18 16:29:46 +0000	[diff] [blame]	1103	assert(0 && "TLS not implemented for PPC.");
				1104	}
				1105
Dale Johannesen	8be83a7	2008-03-04 23:17:14 +0000	[diff] [blame]	1106	SDOperand PPCTargetLowering::LowerGlobalAddress(SDOperand Op,
				1107	SelectionDAG &DAG) {
Dan Gohman	f17a25c	2007-07-18 16:29:46 +0000	[diff] [blame]	1108	MVT::ValueType PtrVT = Op.getValueType();
				1109	GlobalAddressSDNode *GSDN = cast<GlobalAddressSDNode>(Op);
				1110	GlobalValue *GV = GSDN->getGlobal();
				1111	SDOperand GA = DAG.getTargetGlobalAddress(GV, PtrVT, GSDN->getOffset());
Evan Cheng	a5a257d	2008-02-02 05:06:29 +0000	[diff] [blame]	1112	// If it's a debug information descriptor, don't mess with it.
				1113	if (DAG.isVerifiedDebugInfoDesc(Op))
				1114	return GA;
Dan Gohman	f17a25c	2007-07-18 16:29:46 +0000	[diff] [blame]	1115	SDOperand Zero = DAG.getConstant(0, PtrVT);
				1116
				1117	const TargetMachine &TM = DAG.getTarget();
				1118
				1119	SDOperand Hi = DAG.getNode(PPCISD::Hi, PtrVT, GA, Zero);
				1120	SDOperand Lo = DAG.getNode(PPCISD::Lo, PtrVT, GA, Zero);
				1121
				1122	// If this is a non-darwin platform, we don't support non-static relo models
				1123	// yet.
				1124	if (TM.getRelocationModel() == Reloc::Static \|\|
				1125	!TM.getSubtarget<PPCSubtarget>().isDarwin()) {
				1126	// Generate non-pic code that has direct accesses to globals.
				1127	// The address of the global is just (hi(&g)+lo(&g)).
				1128	return DAG.getNode(ISD::ADD, PtrVT, Hi, Lo);
				1129	}
				1130
				1131	if (TM.getRelocationModel() == Reloc::PIC_) {
				1132	// With PIC, the first instruction is actually "GR+hi(&G)".
				1133	Hi = DAG.getNode(ISD::ADD, PtrVT,
				1134	DAG.getNode(PPCISD::GlobalBaseReg, PtrVT), Hi);
				1135	}
				1136
				1137	Lo = DAG.getNode(ISD::ADD, PtrVT, Hi, Lo);
				1138
				1139	if (!TM.getSubtarget<PPCSubtarget>().hasLazyResolverStub(GV))
				1140	return Lo;
				1141
				1142	// If the global is weak or external, we have to go through the lazy
				1143	// resolution stub.
				1144	return DAG.getLoad(PtrVT, DAG.getEntryNode(), Lo, NULL, 0);
				1145	}
				1146
Dale Johannesen	8be83a7	2008-03-04 23:17:14 +0000	[diff] [blame]	1147	SDOperand PPCTargetLowering::LowerSETCC(SDOperand Op, SelectionDAG &DAG) {
Dan Gohman	f17a25c	2007-07-18 16:29:46 +0000	[diff] [blame]	1148	ISD::CondCode CC = cast<CondCodeSDNode>(Op.getOperand(2))->get();
				1149
				1150	// If we're comparing for equality to zero, expose the fact that this is
				1151	// implented as a ctlz/srl pair on ppc, so that the dag combiner can
				1152	// fold the new nodes.
				1153	if (ConstantSDNode *C = dyn_cast<ConstantSDNode>(Op.getOperand(1))) {
				1154	if (C->isNullValue() && CC == ISD::SETEQ) {
				1155	MVT::ValueType VT = Op.getOperand(0).getValueType();
				1156	SDOperand Zext = Op.getOperand(0);
				1157	if (VT < MVT::i32) {
				1158	VT = MVT::i32;
				1159	Zext = DAG.getNode(ISD::ZERO_EXTEND, VT, Op.getOperand(0));
				1160	}
				1161	unsigned Log2b = Log2_32(MVT::getSizeInBits(VT));
				1162	SDOperand Clz = DAG.getNode(ISD::CTLZ, VT, Zext);
				1163	SDOperand Scc = DAG.getNode(ISD::SRL, VT, Clz,
				1164	DAG.getConstant(Log2b, MVT::i32));
				1165	return DAG.getNode(ISD::TRUNCATE, MVT::i32, Scc);
				1166	}
				1167	// Leave comparisons against 0 and -1 alone for now, since they're usually
				1168	// optimized. FIXME: revisit this when we can custom lower all setcc
				1169	// optimizations.
				1170	if (C->isAllOnesValue() \|\| C->isNullValue())
				1171	return SDOperand();
				1172	}
				1173
				1174	// If we have an integer seteq/setne, turn it into a compare against zero
				1175	// by xor'ing the rhs with the lhs, which is faster than setting a
				1176	// condition register, reading it back out, and masking the correct bit. The
				1177	// normal approach here uses sub to do this instead of xor. Using xor exposes
				1178	// the result to other bit-twiddling opportunities.
				1179	MVT::ValueType LHSVT = Op.getOperand(0).getValueType();
				1180	if (MVT::isInteger(LHSVT) && (CC == ISD::SETEQ \|\| CC == ISD::SETNE)) {
				1181	MVT::ValueType VT = Op.getValueType();
				1182	SDOperand Sub = DAG.getNode(ISD::XOR, LHSVT, Op.getOperand(0),
				1183	Op.getOperand(1));
				1184	return DAG.getSetCC(VT, Sub, DAG.getConstant(0, LHSVT), CC);
				1185	}
				1186	return SDOperand();
				1187	}
				1188
Dale Johannesen	8be83a7	2008-03-04 23:17:14 +0000	[diff] [blame]	1189	SDOperand PPCTargetLowering::LowerVAARG(SDOperand Op, SelectionDAG &DAG,
Dan Gohman	f17a25c	2007-07-18 16:29:46 +0000	[diff] [blame]	1190	int VarArgsFrameIndex,
				1191	int VarArgsStackOffset,
				1192	unsigned VarArgsNumGPR,
				1193	unsigned VarArgsNumFPR,
				1194	const PPCSubtarget &Subtarget) {
				1195
				1196	assert(0 && "VAARG in ELF32 ABI not implemented yet!");
				1197	}
				1198
Dale Johannesen	8be83a7	2008-03-04 23:17:14 +0000	[diff] [blame]	1199	SDOperand PPCTargetLowering::LowerVASTART(SDOperand Op, SelectionDAG &DAG,
Dan Gohman	f17a25c	2007-07-18 16:29:46 +0000	[diff] [blame]	1200	int VarArgsFrameIndex,
				1201	int VarArgsStackOffset,
				1202	unsigned VarArgsNumGPR,
				1203	unsigned VarArgsNumFPR,
				1204	const PPCSubtarget &Subtarget) {
				1205
				1206	if (Subtarget.isMachoABI()) {
				1207	// vastart just stores the address of the VarArgsFrameIndex slot into the
				1208	// memory location argument.
				1209	MVT::ValueType PtrVT = DAG.getTargetLoweringInfo().getPointerTy();
				1210	SDOperand FR = DAG.getFrameIndex(VarArgsFrameIndex, PtrVT);
Dan Gohman	12a9c08	2008-02-06 22:27:42 +0000	[diff] [blame]	1211	const Value *SV = cast<SrcValueSDNode>(Op.getOperand(2))->getValue();
				1212	return DAG.getStore(Op.getOperand(0), FR, Op.getOperand(1), SV, 0);
Dan Gohman	f17a25c	2007-07-18 16:29:46 +0000	[diff] [blame]	1213	}
				1214
				1215	// For ELF 32 ABI we follow the layout of the va_list struct.
				1216	// We suppose the given va_list is already allocated.
				1217	//
				1218	// typedef struct {
				1219	// char gpr; /* index into the array of 8 GPRs
				1220	// * stored in the register save area
				1221	// * gpr=0 corresponds to r3,
				1222	// * gpr=1 to r4, etc.
				1223	// */
				1224	// char fpr; /* index into the array of 8 FPRs
				1225	// * stored in the register save area
				1226	// * fpr=0 corresponds to f1,
				1227	// * fpr=1 to f2, etc.
				1228	// */
				1229	// char *overflow_arg_area;
				1230	// /* location on stack that holds
				1231	// * the next overflow argument
				1232	// */
				1233	// char *reg_save_area;
				1234	// /* where r3:r10 and f1:f8 (if saved)
				1235	// * are stored
				1236	// */
				1237	// } va_list[1];
				1238
				1239
				1240	SDOperand ArgGPR = DAG.getConstant(VarArgsNumGPR, MVT::i8);
				1241	SDOperand ArgFPR = DAG.getConstant(VarArgsNumFPR, MVT::i8);
				1242
				1243
				1244	MVT::ValueType PtrVT = DAG.getTargetLoweringInfo().getPointerTy();
				1245
Dan Gohman	12a9c08	2008-02-06 22:27:42 +0000	[diff] [blame]	1246	SDOperand StackOffsetFI = DAG.getFrameIndex(VarArgsStackOffset, PtrVT);
Dan Gohman	f17a25c	2007-07-18 16:29:46 +0000	[diff] [blame]	1247	SDOperand FR = DAG.getFrameIndex(VarArgsFrameIndex, PtrVT);
				1248
Dan Gohman	12a9c08	2008-02-06 22:27:42 +0000	[diff] [blame]	1249	uint64_t FrameOffset = MVT::getSizeInBits(PtrVT)/8;
				1250	SDOperand ConstFrameOffset = DAG.getConstant(FrameOffset, PtrVT);
				1251
				1252	uint64_t StackOffset = MVT::getSizeInBits(PtrVT)/8 - 1;
				1253	SDOperand ConstStackOffset = DAG.getConstant(StackOffset, PtrVT);
				1254
				1255	uint64_t FPROffset = 1;
				1256	SDOperand ConstFPROffset = DAG.getConstant(FPROffset, PtrVT);
Dan Gohman	f17a25c	2007-07-18 16:29:46 +0000	[diff] [blame]	1257
Dan Gohman	12a9c08	2008-02-06 22:27:42 +0000	[diff] [blame]	1258	const Value *SV = cast<SrcValueSDNode>(Op.getOperand(2))->getValue();
Dan Gohman	f17a25c	2007-07-18 16:29:46 +0000	[diff] [blame]	1259
				1260	// Store first byte : number of int regs
				1261	SDOperand firstStore = DAG.getStore(Op.getOperand(0), ArgGPR,
Dan Gohman	12a9c08	2008-02-06 22:27:42 +0000	[diff] [blame]	1262	Op.getOperand(1), SV, 0);
				1263	uint64_t nextOffset = FPROffset;
Dan Gohman	f17a25c	2007-07-18 16:29:46 +0000	[diff] [blame]	1264	SDOperand nextPtr = DAG.getNode(ISD::ADD, PtrVT, Op.getOperand(1),
				1265	ConstFPROffset);
				1266
				1267	// Store second byte : number of float regs
Dan Gohman	12a9c08	2008-02-06 22:27:42 +0000	[diff] [blame]	1268	SDOperand secondStore =
				1269	DAG.getStore(firstStore, ArgFPR, nextPtr, SV, nextOffset);
				1270	nextOffset += StackOffset;
Dan Gohman	f17a25c	2007-07-18 16:29:46 +0000	[diff] [blame]	1271	nextPtr = DAG.getNode(ISD::ADD, PtrVT, nextPtr, ConstStackOffset);
				1272
				1273	// Store second word : arguments given on stack
Dan Gohman	12a9c08	2008-02-06 22:27:42 +0000	[diff] [blame]	1274	SDOperand thirdStore =
				1275	DAG.getStore(secondStore, StackOffsetFI, nextPtr, SV, nextOffset);
				1276	nextOffset += FrameOffset;
Dan Gohman	f17a25c	2007-07-18 16:29:46 +0000	[diff] [blame]	1277	nextPtr = DAG.getNode(ISD::ADD, PtrVT, nextPtr, ConstFrameOffset);
				1278
				1279	// Store third word : arguments given in registers
Dan Gohman	12a9c08	2008-02-06 22:27:42 +0000	[diff] [blame]	1280	return DAG.getStore(thirdStore, FR, nextPtr, SV, nextOffset);
Dan Gohman	f17a25c	2007-07-18 16:29:46 +0000	[diff] [blame]	1281
				1282	}
				1283
				1284	#include "PPCGenCallingConv.inc"
				1285
				1286	/// GetFPR - Get the set of FP registers that should be allocated for arguments,
				1287	/// depending on which subtarget is selected.
				1288	static const unsigned *GetFPR(const PPCSubtarget &Subtarget) {
				1289	if (Subtarget.isMachoABI()) {
				1290	static const unsigned FPR[] = {
				1291	PPC::F1, PPC::F2, PPC::F3, PPC::F4, PPC::F5, PPC::F6, PPC::F7,
				1292	PPC::F8, PPC::F9, PPC::F10, PPC::F11, PPC::F12, PPC::F13
				1293	};
				1294	return FPR;
				1295	}
				1296
				1297
				1298	static const unsigned FPR[] = {
				1299	PPC::F1, PPC::F2, PPC::F3, PPC::F4, PPC::F5, PPC::F6, PPC::F7,
				1300	PPC::F8
				1301	};
				1302	return FPR;
				1303	}
				1304
Bill Wendling	b0edf3d	2008-03-07 20:49:02 +0000	[diff] [blame]	1305	SDOperand
				1306	PPCTargetLowering::LowerFORMAL_ARGUMENTS(SDOperand Op,
				1307	SelectionDAG &DAG,
				1308	int &VarArgsFrameIndex,
				1309	int &VarArgsStackOffset,
				1310	unsigned &VarArgsNumGPR,
				1311	unsigned &VarArgsNumFPR,
				1312	const PPCSubtarget &Subtarget) {
Dan Gohman	f17a25c	2007-07-18 16:29:46 +0000	[diff] [blame]	1313	// TODO: add description of PPC stack frame format, or at least some docs.
				1314	//
				1315	MachineFunction &MF = DAG.getMachineFunction();
				1316	MachineFrameInfo *MFI = MF.getFrameInfo();
Chris Lattner	1b98919	2007-12-31 04:13:23 +0000	[diff] [blame]	1317	MachineRegisterInfo &RegInfo = MF.getRegInfo();
Dan Gohman	f17a25c	2007-07-18 16:29:46 +0000	[diff] [blame]	1318	SmallVector<SDOperand, 8> ArgValues;
				1319	SDOperand Root = Op.getOperand(0);
Dale Johannesen	946b9cc	2008-03-12 00:22:17 +0000	[diff] [blame]	1320	bool isVarArg = cast<ConstantSDNode>(Op.getOperand(2))->getValue() != 0;
Dan Gohman	f17a25c	2007-07-18 16:29:46 +0000	[diff] [blame]	1321
				1322	MVT::ValueType PtrVT = DAG.getTargetLoweringInfo().getPointerTy();
				1323	bool isPPC64 = PtrVT == MVT::i64;
				1324	bool isMachoABI = Subtarget.isMachoABI();
				1325	bool isELF32_ABI = Subtarget.isELF32_ABI();
				1326	unsigned PtrByteSize = isPPC64 ? 8 : 4;
				1327
				1328	unsigned ArgOffset = PPCFrameInfo::getLinkageSize(isPPC64, isMachoABI);
				1329
				1330	static const unsigned GPR_32[] = { // 32-bit registers.
				1331	PPC::R3, PPC::R4, PPC::R5, PPC::R6,
				1332	PPC::R7, PPC::R8, PPC::R9, PPC::R10,
				1333	};
				1334	static const unsigned GPR_64[] = { // 64-bit registers.
				1335	PPC::X3, PPC::X4, PPC::X5, PPC::X6,
				1336	PPC::X7, PPC::X8, PPC::X9, PPC::X10,
				1337	};
				1338
				1339	static const unsigned *FPR = GetFPR(Subtarget);
				1340
				1341	static const unsigned VR[] = {
				1342	PPC::V2, PPC::V3, PPC::V4, PPC::V5, PPC::V6, PPC::V7, PPC::V8,
				1343	PPC::V9, PPC::V10, PPC::V11, PPC::V12, PPC::V13
				1344	};
				1345
Owen Anderson	1636de9	2007-09-07 04:06:50 +0000	[diff] [blame]	1346	const unsigned Num_GPR_Regs = array_lengthof(GPR_32);
Dan Gohman	f17a25c	2007-07-18 16:29:46 +0000	[diff] [blame]	1347	const unsigned Num_FPR_Regs = isMachoABI ? 13 : 8;
Owen Anderson	1636de9	2007-09-07 04:06:50 +0000	[diff] [blame]	1348	const unsigned Num_VR_Regs = array_lengthof( VR);
Dan Gohman	f17a25c	2007-07-18 16:29:46 +0000	[diff] [blame]	1349
				1350	unsigned GPR_idx = 0, FPR_idx = 0, VR_idx = 0;
				1351
				1352	const unsigned *GPR = isPPC64 ? GPR_64 : GPR_32;
				1353
Dale Johannesen	f6a394b	2008-03-14 17:41:26 +0000	[diff] [blame]	1354	// In 32-bit non-varargs functions, the stack space for vectors is after the
				1355	// stack space for non-vectors. We do not use this space unless we have
				1356	// too many vectors to fit in registers, something that only occurs in
				1357	// constructed examples:), but we have to walk the arglist to figure
				1358	// that out...for the pathological case, compute VecArgOffset as the
				1359	// start of the vector parameter area. Computing VecArgOffset is the
				1360	// entire point of the following loop.
				1361	// Altivec is not mentioned in the ppc32 Elf Supplement, so I'm not trying
				1362	// to handle Elf here.
				1363	unsigned VecArgOffset = ArgOffset;
				1364	if (!isVarArg && !isPPC64) {
				1365	for (unsigned ArgNo = 0, e = Op.Val->getNumValues()-1; ArgNo != e;
				1366	++ArgNo) {
				1367	MVT::ValueType ObjectVT = Op.getValue(ArgNo).getValueType();
				1368	unsigned ObjSize = MVT::getSizeInBits(ObjectVT)/8;
				1369	ISD::ParamFlags::ParamFlagsTy Flags =
				1370	cast<ConstantSDNode>(Op.getOperand(ArgNo+3))->getValue();
				1371	unsigned isByVal = Flags & ISD::ParamFlags::ByVal;
				1372
				1373	if (isByVal) {
				1374	// ObjSize is the true size, ArgSize rounded up to multiple of regs.
				1375	ObjSize = (Flags & ISD::ParamFlags::ByValSize) >>
				1376	ISD::ParamFlags::ByValSizeOffs;
				1377	unsigned ArgSize =
				1378	((ObjSize + PtrByteSize - 1)/PtrByteSize) * PtrByteSize;
				1379	VecArgOffset += ArgSize;
				1380	continue;
				1381	}
				1382
				1383	switch(ObjectVT) {
				1384	default: assert(0 && "Unhandled argument type!");
				1385	case MVT::i32:
				1386	case MVT::f32:
				1387	VecArgOffset += isPPC64 ? 8 : 4;
				1388	break;
				1389	case MVT::i64: // PPC64
				1390	case MVT::f64:
				1391	VecArgOffset += 8;
				1392	break;
				1393	case MVT::v4f32:
				1394	case MVT::v4i32:
				1395	case MVT::v8i16:
				1396	case MVT::v16i8:
				1397	// Nothing to do, we're only looking at Nonvector args here.
				1398	break;
				1399	}
				1400	}
				1401	}
				1402	// We've found where the vector parameter area in memory is. Skip the
				1403	// first 12 parameters; these don't use that memory.
				1404	VecArgOffset = ((VecArgOffset+15)/16)*16;
				1405	VecArgOffset += 12*16;
				1406
Dan Gohman	f17a25c	2007-07-18 16:29:46 +0000	[diff] [blame]	1407	// Add DAG nodes to load the arguments or copy them out of registers. On
				1408	// entry to a function on PPC, the arguments start after the linkage area,
				1409	// although the first ones are often in registers.
				1410	//
				1411	// In the ELF 32 ABI, GPRs and stack are double word align: an argument
				1412	// represented with two words (long long or double) must be copied to an
				1413	// even GPR_idx value or to an even ArgOffset value.
				1414
Dale Johannesen	eaea88c	2008-03-07 20:27:40 +0000	[diff] [blame]	1415	SmallVector<SDOperand, 8> MemOps;
				1416
Dan Gohman	f17a25c	2007-07-18 16:29:46 +0000	[diff] [blame]	1417	for (unsigned ArgNo = 0, e = Op.Val->getNumValues()-1; ArgNo != e; ++ArgNo) {
				1418	SDOperand ArgVal;
				1419	bool needsLoad = false;
				1420	MVT::ValueType ObjectVT = Op.getValue(ArgNo).getValueType();
				1421	unsigned ObjSize = MVT::getSizeInBits(ObjectVT)/8;
				1422	unsigned ArgSize = ObjSize;
Dale Johannesen	322e3b7	2008-03-10 02:17:22 +0000	[diff] [blame]	1423	ISD::ParamFlags::ParamFlagsTy Flags =
				1424	cast<ConstantSDNode>(Op.getOperand(ArgNo+3))->getValue();
				1425	unsigned AlignFlag = ISD::ParamFlags::One
				1426	<< ISD::ParamFlags::OrigAlignmentOffs;
Dale Johannesen	eaea88c	2008-03-07 20:27:40 +0000	[diff] [blame]	1427	unsigned isByVal = Flags & ISD::ParamFlags::ByVal;
Dan Gohman	f17a25c	2007-07-18 16:29:46 +0000	[diff] [blame]	1428	// See if next argument requires stack alignment in ELF
				1429	bool Expand = (ObjectVT == MVT::f64) \|\| ((ArgNo + 1 < e) &&
				1430	(cast<ConstantSDNode>(Op.getOperand(ArgNo+4))->getValue() & AlignFlag) &&
				1431	(!(Flags & AlignFlag)));
				1432
				1433	unsigned CurArgOffset = ArgOffset;
Dale Johannesen	eaea88c	2008-03-07 20:27:40 +0000	[diff] [blame]	1434
				1435	// FIXME alignment for ELF may not be right
				1436	// FIXME the codegen can be much improved in some cases.
				1437	// We do not have to keep everything in memory.
				1438	if (isByVal) {
Dale Johannesen	eaea88c	2008-03-07 20:27:40 +0000	[diff] [blame]	1439	// ObjSize is the true size, ArgSize rounded up to multiple of registers.
				1440	ObjSize = (Flags & ISD::ParamFlags::ByValSize) >>
				1441	ISD::ParamFlags::ByValSizeOffs;
				1442	ArgSize = ((ObjSize + PtrByteSize - 1)/PtrByteSize) * PtrByteSize;
Dale Johannesen	05b4dbc	2008-03-08 01:41:42 +0000	[diff] [blame]	1443	// Double word align in ELF
				1444	if (Expand && isELF32_ABI) GPR_idx += (GPR_idx % 2);
				1445	// Objects of size 1 and 2 are right justified, everything else is
				1446	// left justified. This means the memory address is adjusted forwards.
				1447	if (ObjSize==1 \|\| ObjSize==2) {
				1448	CurArgOffset = CurArgOffset + (4 - ObjSize);
				1449	}
Dale Johannesen	eaea88c	2008-03-07 20:27:40 +0000	[diff] [blame]	1450	// The value of the object is its address.
				1451	int FI = MFI->CreateFixedObject(ObjSize, CurArgOffset);
				1452	SDOperand FIN = DAG.getFrameIndex(FI, PtrVT);
				1453	ArgValues.push_back(FIN);
Dale Johannesen	05b4dbc	2008-03-08 01:41:42 +0000	[diff] [blame]	1454	if (ObjSize==1 \|\| ObjSize==2) {
				1455	if (GPR_idx != Num_GPR_Regs) {
				1456	unsigned VReg = RegInfo.createVirtualRegister(&PPC::GPRCRegClass);
				1457	RegInfo.addLiveIn(GPR[GPR_idx], VReg);
				1458	SDOperand Val = DAG.getCopyFromReg(Root, VReg, PtrVT);
				1459	SDOperand Store = DAG.getTruncStore(Val.getValue(1), Val, FIN,
				1460	NULL, 0, ObjSize==1 ? MVT::i8 : MVT::i16 );
				1461	MemOps.push_back(Store);
				1462	++GPR_idx;
				1463	if (isMachoABI) ArgOffset += PtrByteSize;
				1464	} else {
				1465	ArgOffset += PtrByteSize;
				1466	}
				1467	continue;
				1468	}
Dale Johannesen	eaea88c	2008-03-07 20:27:40 +0000	[diff] [blame]	1469	for (unsigned j = 0; j < ArgSize; j += PtrByteSize) {
				1470	// Store whatever pieces of the object are in registers
				1471	// to memory. ArgVal will be address of the beginning of
				1472	// the object.
				1473	if (GPR_idx != Num_GPR_Regs) {
				1474	unsigned VReg = RegInfo.createVirtualRegister(&PPC::GPRCRegClass);
				1475	RegInfo.addLiveIn(GPR[GPR_idx], VReg);
				1476	int FI = MFI->CreateFixedObject(PtrByteSize, ArgOffset);
				1477	SDOperand FIN = DAG.getFrameIndex(FI, PtrVT);
				1478	SDOperand Val = DAG.getCopyFromReg(Root, VReg, PtrVT);
				1479	SDOperand Store = DAG.getStore(Val.getValue(1), Val, FIN, NULL, 0);
				1480	MemOps.push_back(Store);
				1481	++GPR_idx;
				1482	if (isMachoABI) ArgOffset += PtrByteSize;
				1483	} else {
				1484	ArgOffset += ArgSize - (ArgOffset-CurArgOffset);
				1485	break;
				1486	}
				1487	}
				1488	continue;
				1489	}
				1490
Dan Gohman	f17a25c	2007-07-18 16:29:46 +0000	[diff] [blame]	1491	switch (ObjectVT) {
				1492	default: assert(0 && "Unhandled argument type!");
				1493	case MVT::i32:
Bill Wendling	b0edf3d	2008-03-07 20:49:02 +0000	[diff] [blame]	1494	if (!isPPC64) {
				1495	// Double word align in ELF
				1496	if (Expand && isELF32_ABI) GPR_idx += (GPR_idx % 2);
				1497
				1498	if (GPR_idx != Num_GPR_Regs) {
				1499	unsigned VReg = RegInfo.createVirtualRegister(&PPC::GPRCRegClass);
				1500	RegInfo.addLiveIn(GPR[GPR_idx], VReg);
				1501	ArgVal = DAG.getCopyFromReg(Root, VReg, MVT::i32);
				1502	++GPR_idx;
				1503	} else {
				1504	needsLoad = true;
				1505	ArgSize = PtrByteSize;
				1506	}
				1507	// Stack align in ELF
				1508	if (needsLoad && Expand && isELF32_ABI)
				1509	ArgOffset += ((ArgOffset/4) % 2) * PtrByteSize;
				1510	// All int arguments reserve stack space in Macho ABI.
				1511	if (isMachoABI \|\| needsLoad) ArgOffset += PtrByteSize;
				1512	break;
Dan Gohman	f17a25c	2007-07-18 16:29:46 +0000	[diff] [blame]	1513	}
Bill Wendling	b0edf3d	2008-03-07 20:49:02 +0000	[diff] [blame]	1514	// FALLTHROUGH
Dan Gohman	f17a25c	2007-07-18 16:29:46 +0000	[diff] [blame]	1515	case MVT::i64: // PPC64
				1516	if (GPR_idx != Num_GPR_Regs) {
Chris Lattner	1b98919	2007-12-31 04:13:23 +0000	[diff] [blame]	1517	unsigned VReg = RegInfo.createVirtualRegister(&PPC::G8RCRegClass);
				1518	RegInfo.addLiveIn(GPR[GPR_idx], VReg);
Dan Gohman	f17a25c	2007-07-18 16:29:46 +0000	[diff] [blame]	1519	ArgVal = DAG.getCopyFromReg(Root, VReg, MVT::i64);
Bill Wendling	b0edf3d	2008-03-07 20:49:02 +0000	[diff] [blame]	1520
				1521	if (ObjectVT == MVT::i32) {
				1522	// PPC64 passes i8, i16, and i32 values in i64 registers. Promote
				1523	// value to MVT::i64 and then truncate to the correct register size.
				1524	if (Flags & ISD::ParamFlags::SExt)
				1525	ArgVal = DAG.getNode(ISD::AssertSext, MVT::i64, ArgVal,
				1526	DAG.getValueType(ObjectVT));
				1527	else if (Flags & ISD::ParamFlags::ZExt)
				1528	ArgVal = DAG.getNode(ISD::AssertZext, MVT::i64, ArgVal,
				1529	DAG.getValueType(ObjectVT));
				1530
				1531	ArgVal = DAG.getNode(ISD::TRUNCATE, MVT::i32, ArgVal);
				1532	}
				1533
Dan Gohman	f17a25c	2007-07-18 16:29:46 +0000	[diff] [blame]	1534	++GPR_idx;
				1535	} else {
				1536	needsLoad = true;
				1537	}
				1538	// All int arguments reserve stack space in Macho ABI.
				1539	if (isMachoABI \|\| needsLoad) ArgOffset += 8;
				1540	break;
				1541
				1542	case MVT::f32:
				1543	case MVT::f64:
				1544	// Every 4 bytes of argument space consumes one of the GPRs available for
				1545	// argument passing.
				1546	if (GPR_idx != Num_GPR_Regs && isMachoABI) {
				1547	++GPR_idx;
				1548	if (ObjSize == 8 && GPR_idx != Num_GPR_Regs && !isPPC64)
				1549	++GPR_idx;
				1550	}
				1551	if (FPR_idx != Num_FPR_Regs) {
				1552	unsigned VReg;
				1553	if (ObjectVT == MVT::f32)
Chris Lattner	1b98919	2007-12-31 04:13:23 +0000	[diff] [blame]	1554	VReg = RegInfo.createVirtualRegister(&PPC::F4RCRegClass);
Dan Gohman	f17a25c	2007-07-18 16:29:46 +0000	[diff] [blame]	1555	else
Chris Lattner	1b98919	2007-12-31 04:13:23 +0000	[diff] [blame]	1556	VReg = RegInfo.createVirtualRegister(&PPC::F8RCRegClass);
				1557	RegInfo.addLiveIn(FPR[FPR_idx], VReg);
Dan Gohman	f17a25c	2007-07-18 16:29:46 +0000	[diff] [blame]	1558	ArgVal = DAG.getCopyFromReg(Root, VReg, ObjectVT);
				1559	++FPR_idx;
				1560	} else {
				1561	needsLoad = true;
				1562	}
				1563
				1564	// Stack align in ELF
				1565	if (needsLoad && Expand && isELF32_ABI)
				1566	ArgOffset += ((ArgOffset/4) % 2) * PtrByteSize;
				1567	// All FP arguments reserve stack space in Macho ABI.
				1568	if (isMachoABI \|\| needsLoad) ArgOffset += isPPC64 ? 8 : ObjSize;
				1569	break;
				1570	case MVT::v4f32:
				1571	case MVT::v4i32:
				1572	case MVT::v8i16:
				1573	case MVT::v16i8:
Dale Johannesen	946b9cc	2008-03-12 00:22:17 +0000	[diff] [blame]	1574	// Note that vector arguments in registers don't reserve stack space,
				1575	// except in varargs functions.
Dan Gohman	f17a25c	2007-07-18 16:29:46 +0000	[diff] [blame]	1576	if (VR_idx != Num_VR_Regs) {
Chris Lattner	1b98919	2007-12-31 04:13:23 +0000	[diff] [blame]	1577	unsigned VReg = RegInfo.createVirtualRegister(&PPC::VRRCRegClass);
				1578	RegInfo.addLiveIn(VR[VR_idx], VReg);
Dan Gohman	f17a25c	2007-07-18 16:29:46 +0000	[diff] [blame]	1579	ArgVal = DAG.getCopyFromReg(Root, VReg, ObjectVT);
Dale Johannesen	946b9cc	2008-03-12 00:22:17 +0000	[diff] [blame]	1580	if (isVarArg) {
				1581	while ((ArgOffset % 16) != 0) {
				1582	ArgOffset += PtrByteSize;
				1583	if (GPR_idx != Num_GPR_Regs)
				1584	GPR_idx++;
				1585	}
				1586	ArgOffset += 16;
				1587	GPR_idx = std::min(GPR_idx+4, Num_GPR_Regs);
				1588	}
Dan Gohman	f17a25c	2007-07-18 16:29:46 +0000	[diff] [blame]	1589	++VR_idx;
				1590	} else {
Dale Johannesen	f6a394b	2008-03-14 17:41:26 +0000	[diff] [blame]	1591	if (!isVarArg && !isPPC64) {
				1592	// Vectors go after all the nonvectors.
				1593	CurArgOffset = VecArgOffset;
				1594	VecArgOffset += 16;
				1595	} else {
				1596	// Vectors are aligned.
				1597	ArgOffset = ((ArgOffset+15)/16)*16;
				1598	CurArgOffset = ArgOffset;
				1599	ArgOffset += 16;
Dale Johannesen	896870b	2008-03-12 00:49:20 +0000	[diff] [blame]	1600	}
Dan Gohman	f17a25c	2007-07-18 16:29:46 +0000	[diff] [blame]	1601	needsLoad = true;
				1602	}
				1603	break;
				1604	}
				1605
				1606	// We need to load the argument to a virtual register if we determined above
Chris Lattner	6006945	2008-02-13 07:35:30 +0000	[diff] [blame]	1607	// that we ran out of physical registers of the appropriate type.
Dan Gohman	f17a25c	2007-07-18 16:29:46 +0000	[diff] [blame]	1608	if (needsLoad) {
Chris Lattner	6006945	2008-02-13 07:35:30 +0000	[diff] [blame]	1609	int FI = MFI->CreateFixedObject(ObjSize,
				1610	CurArgOffset + (ArgSize - ObjSize));
				1611	SDOperand FIN = DAG.getFrameIndex(FI, PtrVT);
				1612	ArgVal = DAG.getLoad(ObjectVT, Root, FIN, NULL, 0);
Dan Gohman	f17a25c	2007-07-18 16:29:46 +0000	[diff] [blame]	1613	}
				1614
				1615	ArgValues.push_back(ArgVal);
				1616	}
Dale Johannesen	eaea88c	2008-03-07 20:27:40 +0000	[diff] [blame]	1617
Dan Gohman	f17a25c	2007-07-18 16:29:46 +0000	[diff] [blame]	1618	// If the function takes variable number of arguments, make a frame index for
				1619	// the start of the first vararg value... for expansion of llvm.va_start.
Dan Gohman	f17a25c	2007-07-18 16:29:46 +0000	[diff] [blame]	1620	if (isVarArg) {
				1621
				1622	int depth;
				1623	if (isELF32_ABI) {
				1624	VarArgsNumGPR = GPR_idx;
				1625	VarArgsNumFPR = FPR_idx;
				1626
				1627	// Make room for Num_GPR_Regs, Num_FPR_Regs and for a possible frame
				1628	// pointer.
				1629	depth = -(Num_GPR_Regs * MVT::getSizeInBits(PtrVT)/8 +
				1630	Num_FPR_Regs * MVT::getSizeInBits(MVT::f64)/8 +
				1631	MVT::getSizeInBits(PtrVT)/8);
				1632
				1633	VarArgsStackOffset = MFI->CreateFixedObject(MVT::getSizeInBits(PtrVT)/8,
				1634	ArgOffset);
				1635
				1636	}
				1637	else
				1638	depth = ArgOffset;
				1639
				1640	VarArgsFrameIndex = MFI->CreateFixedObject(MVT::getSizeInBits(PtrVT)/8,
				1641	depth);
				1642	SDOperand FIN = DAG.getFrameIndex(VarArgsFrameIndex, PtrVT);
				1643
Dan Gohman	f17a25c	2007-07-18 16:29:46 +0000	[diff] [blame]	1644	// In ELF 32 ABI, the fixed integer arguments of a variadic function are
				1645	// stored to the VarArgsFrameIndex on the stack.
				1646	if (isELF32_ABI) {
				1647	for (GPR_idx = 0; GPR_idx != VarArgsNumGPR; ++GPR_idx) {
				1648	SDOperand Val = DAG.getRegister(GPR[GPR_idx], PtrVT);
				1649	SDOperand Store = DAG.getStore(Root, Val, FIN, NULL, 0);
				1650	MemOps.push_back(Store);
				1651	// Increment the address by four for the next argument to store
				1652	SDOperand PtrOff = DAG.getConstant(MVT::getSizeInBits(PtrVT)/8, PtrVT);
				1653	FIN = DAG.getNode(ISD::ADD, PtrOff.getValueType(), FIN, PtrOff);
				1654	}
				1655	}
				1656
				1657	// If this function is vararg, store any remaining integer argument regs
				1658	// to their spots on the stack so that they may be loaded by deferencing the
				1659	// result of va_next.
				1660	for (; GPR_idx != Num_GPR_Regs; ++GPR_idx) {
				1661	unsigned VReg;
				1662	if (isPPC64)
Chris Lattner	1b98919	2007-12-31 04:13:23 +0000	[diff] [blame]	1663	VReg = RegInfo.createVirtualRegister(&PPC::G8RCRegClass);
Dan Gohman	f17a25c	2007-07-18 16:29:46 +0000	[diff] [blame]	1664	else
Chris Lattner	1b98919	2007-12-31 04:13:23 +0000	[diff] [blame]	1665	VReg = RegInfo.createVirtualRegister(&PPC::GPRCRegClass);
Dan Gohman	f17a25c	2007-07-18 16:29:46 +0000	[diff] [blame]	1666
Chris Lattner	1b98919	2007-12-31 04:13:23 +0000	[diff] [blame]	1667	RegInfo.addLiveIn(GPR[GPR_idx], VReg);
Dan Gohman	f17a25c	2007-07-18 16:29:46 +0000	[diff] [blame]	1668	SDOperand Val = DAG.getCopyFromReg(Root, VReg, PtrVT);
				1669	SDOperand Store = DAG.getStore(Val.getValue(1), Val, FIN, NULL, 0);
				1670	MemOps.push_back(Store);
				1671	// Increment the address by four for the next argument to store
				1672	SDOperand PtrOff = DAG.getConstant(MVT::getSizeInBits(PtrVT)/8, PtrVT);
				1673	FIN = DAG.getNode(ISD::ADD, PtrOff.getValueType(), FIN, PtrOff);
				1674	}
				1675
				1676	// In ELF 32 ABI, the double arguments are stored to the VarArgsFrameIndex
				1677	// on the stack.
				1678	if (isELF32_ABI) {
				1679	for (FPR_idx = 0; FPR_idx != VarArgsNumFPR; ++FPR_idx) {
				1680	SDOperand Val = DAG.getRegister(FPR[FPR_idx], MVT::f64);
				1681	SDOperand Store = DAG.getStore(Root, Val, FIN, NULL, 0);
				1682	MemOps.push_back(Store);
				1683	// Increment the address by eight for the next argument to store
				1684	SDOperand PtrOff = DAG.getConstant(MVT::getSizeInBits(MVT::f64)/8,
				1685	PtrVT);
				1686	FIN = DAG.getNode(ISD::ADD, PtrOff.getValueType(), FIN, PtrOff);
				1687	}
				1688
				1689	for (; FPR_idx != Num_FPR_Regs; ++FPR_idx) {
				1690	unsigned VReg;
Chris Lattner	1b98919	2007-12-31 04:13:23 +0000	[diff] [blame]	1691	VReg = RegInfo.createVirtualRegister(&PPC::F8RCRegClass);
Dan Gohman	f17a25c	2007-07-18 16:29:46 +0000	[diff] [blame]	1692
Chris Lattner	1b98919	2007-12-31 04:13:23 +0000	[diff] [blame]	1693	RegInfo.addLiveIn(FPR[FPR_idx], VReg);
Dan Gohman	f17a25c	2007-07-18 16:29:46 +0000	[diff] [blame]	1694	SDOperand Val = DAG.getCopyFromReg(Root, VReg, MVT::f64);
				1695	SDOperand Store = DAG.getStore(Val.getValue(1), Val, FIN, NULL, 0);
				1696	MemOps.push_back(Store);
				1697	// Increment the address by eight for the next argument to store
				1698	SDOperand PtrOff = DAG.getConstant(MVT::getSizeInBits(MVT::f64)/8,
				1699	PtrVT);
				1700	FIN = DAG.getNode(ISD::ADD, PtrOff.getValueType(), FIN, PtrOff);
				1701	}
				1702	}
Dan Gohman	f17a25c	2007-07-18 16:29:46 +0000	[diff] [blame]	1703	}
				1704
Dale Johannesen	eaea88c	2008-03-07 20:27:40 +0000	[diff] [blame]	1705	if (!MemOps.empty())
				1706	Root = DAG.getNode(ISD::TokenFactor, MVT::Other,&MemOps[0],MemOps.size());
				1707
Dan Gohman	f17a25c	2007-07-18 16:29:46 +0000	[diff] [blame]	1708	ArgValues.push_back(Root);
				1709
				1710	// Return the new list of results.
				1711	std::vector<MVT::ValueType> RetVT(Op.Val->value_begin(),
				1712	Op.Val->value_end());
				1713	return DAG.getNode(ISD::MERGE_VALUES, RetVT, &ArgValues[0], ArgValues.size());
				1714	}
				1715
				1716	/// isCallCompatibleAddress - Return the immediate to use if the specified
				1717	/// 32-bit value is representable in the immediate field of a BxA instruction.
				1718	static SDNode *isBLACompatibleAddress(SDOperand Op, SelectionDAG &DAG) {
				1719	ConstantSDNode *C = dyn_cast<ConstantSDNode>(Op);
				1720	if (!C) return 0;
				1721
				1722	int Addr = C->getValue();
				1723	if ((Addr & 3) != 0 \|\| // Low 2 bits are implicitly zero.
				1724	(Addr << 6 >> 6) != Addr)
				1725	return 0; // Top 6 bits have to be sext of immediate.
				1726
Evan Cheng	282c646	2007-10-22 19:46:19 +0000	[diff] [blame]	1727	return DAG.getConstant((int)C->getValue() >> 2,
				1728	DAG.getTargetLoweringInfo().getPointerTy()).Val;
Dan Gohman	f17a25c	2007-07-18 16:29:46 +0000	[diff] [blame]	1729	}
				1730
Dale Johannesen	8be83a7	2008-03-04 23:17:14 +0000	[diff] [blame]	1731	/// CreateCopyOfByValArgument - Make a copy of an aggregate at address specified
				1732	/// by "Src" to address "Dst" of size "Size". Alignment information is
				1733	/// specified by the specific parameter attribute. The copy will be passed as
				1734	/// a byval function parameter.
				1735	/// Sometimes what we are copying is the end of a larger object, the part that
				1736	/// does not fit in registers.
				1737	static SDOperand
				1738	CreateCopyOfByValArgument(SDOperand Src, SDOperand Dst, SDOperand Chain,
Dale Johannesen	322e3b7	2008-03-10 02:17:22 +0000	[diff] [blame]	1739	ISD::ParamFlags::ParamFlagsTy Flags,
				1740	SelectionDAG &DAG, unsigned Size) {
				1741	unsigned Align = ISD::ParamFlags::One <<
Dale Johannesen	8be83a7	2008-03-04 23:17:14 +0000	[diff] [blame]	1742	((Flags & ISD::ParamFlags::ByValAlign) >> ISD::ParamFlags::ByValAlignOffs);
				1743	SDOperand AlignNode = DAG.getConstant(Align, MVT::i32);
				1744	SDOperand SizeNode = DAG.getConstant(Size, MVT::i32);
Dale Johannesen	7a7aa10	2008-03-05 23:31:27 +0000	[diff] [blame]	1745	SDOperand AlwaysInline = DAG.getConstant(0, MVT::i32);
Dale Johannesen	8be83a7	2008-03-04 23:17:14 +0000	[diff] [blame]	1746	return DAG.getMemcpy(Chain, Dst, Src, SizeNode, AlignNode, AlwaysInline);
				1747	}
Dan Gohman	f17a25c	2007-07-18 16:29:46 +0000	[diff] [blame]	1748
Dale Johannesen	8be83a7	2008-03-04 23:17:14 +0000	[diff] [blame]	1749	SDOperand PPCTargetLowering::LowerCALL(SDOperand Op, SelectionDAG &DAG,
				1750	const PPCSubtarget &Subtarget) {
Dan Gohman	f17a25c	2007-07-18 16:29:46 +0000	[diff] [blame]	1751	SDOperand Chain = Op.getOperand(0);
				1752	bool isVarArg = cast<ConstantSDNode>(Op.getOperand(2))->getValue() != 0;
				1753	SDOperand Callee = Op.getOperand(4);
				1754	unsigned NumOps = (Op.getNumOperands() - 5) / 2;
				1755
				1756	bool isMachoABI = Subtarget.isMachoABI();
				1757	bool isELF32_ABI = Subtarget.isELF32_ABI();
				1758
				1759	MVT::ValueType PtrVT = DAG.getTargetLoweringInfo().getPointerTy();
				1760	bool isPPC64 = PtrVT == MVT::i64;
				1761	unsigned PtrByteSize = isPPC64 ? 8 : 4;
				1762
				1763	// args_to_use will accumulate outgoing args for the PPCISD::CALL case in
				1764	// SelectExpr to use to put the arguments in the appropriate registers.
				1765	std::vector<SDOperand> args_to_use;
				1766
				1767	// Count how many bytes are to be pushed on the stack, including the linkage
				1768	// area, and parameter passing area. We start with 24/48 bytes, which is
				1769	// prereserved space for [SP][CR][LR][3 x unused].
				1770	unsigned NumBytes = PPCFrameInfo::getLinkageSize(isPPC64, isMachoABI);
Dale Johannesen	946b9cc	2008-03-12 00:22:17 +0000	[diff] [blame]	1771
Dan Gohman	f17a25c	2007-07-18 16:29:46 +0000	[diff] [blame]	1772	// Add up all the space actually used.
Dale Johannesen	f6a394b	2008-03-14 17:41:26 +0000	[diff] [blame]	1773	// In 32-bit non-varargs calls, Altivec parameters all go at the end; usually
				1774	// they all go in registers, but we must reserve stack space for them for
				1775	// possible use by the caller. In varargs or 64-bit calls, parameters are
				1776	// assigned stack space in order, with padding so Altivec parameters are
				1777	// 16-byte aligned.
				1778	unsigned nAltivecParamsAtEnd = 0;
Dan Gohman	f17a25c	2007-07-18 16:29:46 +0000	[diff] [blame]	1779	for (unsigned i = 0; i != NumOps; ++i) {
Dale Johannesen	946b9cc	2008-03-12 00:22:17 +0000	[diff] [blame]	1780	SDOperand Arg = Op.getOperand(5+2*i);
				1781	MVT::ValueType ArgVT = Arg.getValueType();
Dale Johannesen	f6a394b	2008-03-14 17:41:26 +0000	[diff] [blame]	1782	if (ArgVT==MVT::v4f32 \|\| ArgVT==MVT::v4i32 \|\|
				1783	ArgVT==MVT::v8i16 \|\| ArgVT==MVT::v16i8) {
				1784	if (!isVarArg && !isPPC64) {
				1785	// Non-varargs Altivec parameters go after all the non-Altivec parameters;
				1786	// do those last so we know how much padding we need.
				1787	nAltivecParamsAtEnd++;
				1788	continue;
				1789	} else {
				1790	// Varargs and 64-bit Altivec parameters are padded to 16 byte boundary.
				1791	NumBytes = ((NumBytes+15)/16)*16;
				1792	}
				1793	}
Dale Johannesen	322e3b7	2008-03-10 02:17:22 +0000	[diff] [blame]	1794	ISD::ParamFlags::ParamFlagsTy Flags =
				1795	cast<ConstantSDNode>(Op.getOperand(5+2*i+1))->getValue();
Dan Gohman	f17a25c	2007-07-18 16:29:46 +0000	[diff] [blame]	1796	unsigned ArgSize =MVT::getSizeInBits(Op.getOperand(5+2*i).getValueType())/8;
Dale Johannesen	8be83a7	2008-03-04 23:17:14 +0000	[diff] [blame]	1797	if (Flags & ISD::ParamFlags::ByVal)
				1798	ArgSize = (Flags & ISD::ParamFlags::ByValSize) >>
				1799	ISD::ParamFlags::ByValSizeOffs;
Dale Johannesen	05b4dbc	2008-03-08 01:41:42 +0000	[diff] [blame]	1800	ArgSize = ((ArgSize + PtrByteSize - 1)/PtrByteSize) * PtrByteSize;
Dan Gohman	f17a25c	2007-07-18 16:29:46 +0000	[diff] [blame]	1801	NumBytes += ArgSize;
				1802	}
Dale Johannesen	f6a394b	2008-03-14 17:41:26 +0000	[diff] [blame]	1803	// Allow for Altivec parameters at the end, if needed.
				1804	if (nAltivecParamsAtEnd) {
				1805	NumBytes = ((NumBytes+15)/16)*16;
				1806	NumBytes += 16*nAltivecParamsAtEnd;
				1807	}
Dan Gohman	f17a25c	2007-07-18 16:29:46 +0000	[diff] [blame]	1808
				1809	// The prolog code of the callee may store up to 8 GPR argument registers to
				1810	// the stack, allowing va_start to index over them in memory if its varargs.
				1811	// Because we cannot tell if this is needed on the caller side, we have to
				1812	// conservatively assume that it is needed. As such, make sure we have at
				1813	// least enough stack space for the caller to store the 8 GPRs.
				1814	NumBytes = std::max(NumBytes,
				1815	PPCFrameInfo::getMinCallFrameSize(isPPC64, isMachoABI));
				1816
				1817	// Adjust the stack pointer for the new arguments...
				1818	// These operations are automatically eliminated by the prolog/epilog pass
				1819	Chain = DAG.getCALLSEQ_START(Chain,
				1820	DAG.getConstant(NumBytes, PtrVT));
Dale Johannesen	7a7aa10	2008-03-05 23:31:27 +0000	[diff] [blame]	1821	SDOperand CallSeqStart = Chain;
Dan Gohman	f17a25c	2007-07-18 16:29:46 +0000	[diff] [blame]	1822
				1823	// Set up a copy of the stack pointer for use loading and storing any
				1824	// arguments that may not fit in the registers available for argument
				1825	// passing.
				1826	SDOperand StackPtr;
				1827	if (isPPC64)
				1828	StackPtr = DAG.getRegister(PPC::X1, MVT::i64);
				1829	else
				1830	StackPtr = DAG.getRegister(PPC::R1, MVT::i32);
				1831
				1832	// Figure out which arguments are going to go in registers, and which in
				1833	// memory. Also, if this is a vararg function, floating point operations
				1834	// must be stored to our stack, and loaded into integer regs as well, if
				1835	// any integer regs are available for argument passing.
				1836	unsigned ArgOffset = PPCFrameInfo::getLinkageSize(isPPC64, isMachoABI);
				1837	unsigned GPR_idx = 0, FPR_idx = 0, VR_idx = 0;
				1838
				1839	static const unsigned GPR_32[] = { // 32-bit registers.
				1840	PPC::R3, PPC::R4, PPC::R5, PPC::R6,
				1841	PPC::R7, PPC::R8, PPC::R9, PPC::R10,
				1842	};
				1843	static const unsigned GPR_64[] = { // 64-bit registers.
				1844	PPC::X3, PPC::X4, PPC::X5, PPC::X6,
				1845	PPC::X7, PPC::X8, PPC::X9, PPC::X10,
				1846	};
				1847	static const unsigned *FPR = GetFPR(Subtarget);
				1848
				1849	static const unsigned VR[] = {
				1850	PPC::V2, PPC::V3, PPC::V4, PPC::V5, PPC::V6, PPC::V7, PPC::V8,
				1851	PPC::V9, PPC::V10, PPC::V11, PPC::V12, PPC::V13
				1852	};
Owen Anderson	1636de9	2007-09-07 04:06:50 +0000	[diff] [blame]	1853	const unsigned NumGPRs = array_lengthof(GPR_32);
Dan Gohman	f17a25c	2007-07-18 16:29:46 +0000	[diff] [blame]	1854	const unsigned NumFPRs = isMachoABI ? 13 : 8;
Owen Anderson	1636de9	2007-09-07 04:06:50 +0000	[diff] [blame]	1855	const unsigned NumVRs = array_lengthof( VR);
Dan Gohman	f17a25c	2007-07-18 16:29:46 +0000	[diff] [blame]	1856
				1857	const unsigned *GPR = isPPC64 ? GPR_64 : GPR_32;
				1858
				1859	std::vector<std::pair<unsigned, SDOperand> > RegsToPass;
				1860	SmallVector<SDOperand, 8> MemOpChains;
				1861	for (unsigned i = 0; i != NumOps; ++i) {
				1862	bool inMem = false;
				1863	SDOperand Arg = Op.getOperand(5+2*i);
Dale Johannesen	322e3b7	2008-03-10 02:17:22 +0000	[diff] [blame]	1864	ISD::ParamFlags::ParamFlagsTy Flags =
				1865	cast<ConstantSDNode>(Op.getOperand(5+2*i+1))->getValue();
				1866	unsigned AlignFlag = ISD::ParamFlags::One <<
				1867	ISD::ParamFlags::OrigAlignmentOffs;
Dan Gohman	f17a25c	2007-07-18 16:29:46 +0000	[diff] [blame]	1868	// See if next argument requires stack alignment in ELF
				1869	unsigned next = 5+2*(i+1)+1;
				1870	bool Expand = (Arg.getValueType() == MVT::f64) \|\| ((i + 1 < NumOps) &&
				1871	(cast<ConstantSDNode>(Op.getOperand(next))->getValue() & AlignFlag) &&
				1872	(!(Flags & AlignFlag)));
				1873
				1874	// PtrOff will be used to store the current argument to the stack if a
				1875	// register cannot be found for it.
				1876	SDOperand PtrOff;
				1877
				1878	// Stack align in ELF 32
				1879	if (isELF32_ABI && Expand)
				1880	PtrOff = DAG.getConstant(ArgOffset + ((ArgOffset/4) % 2) * PtrByteSize,
				1881	StackPtr.getValueType());
				1882	else
				1883	PtrOff = DAG.getConstant(ArgOffset, StackPtr.getValueType());
				1884
				1885	PtrOff = DAG.getNode(ISD::ADD, PtrVT, StackPtr, PtrOff);
				1886
				1887	// On PPC64, promote integers to 64-bit values.
				1888	if (isPPC64 && Arg.getValueType() == MVT::i32) {
				1889	unsigned ExtOp = (Flags & 1) ? ISD::SIGN_EXTEND : ISD::ZERO_EXTEND;
Dan Gohman	f17a25c	2007-07-18 16:29:46 +0000	[diff] [blame]	1890	Arg = DAG.getNode(ExtOp, MVT::i64, Arg);
				1891	}
Dale Johannesen	8be83a7	2008-03-04 23:17:14 +0000	[diff] [blame]	1892
				1893	// FIXME Elf untested, what are alignment rules?
Dale Johannesen	eaea88c	2008-03-07 20:27:40 +0000	[diff] [blame]	1894	// FIXME memcpy is used way more than necessary. Correctness first.
Dale Johannesen	8be83a7	2008-03-04 23:17:14 +0000	[diff] [blame]	1895	if (Flags & ISD::ParamFlags::ByVal) {
				1896	unsigned Size = (Flags & ISD::ParamFlags::ByValSize) >>
				1897	ISD::ParamFlags::ByValSizeOffs;
				1898	if (isELF32_ABI && Expand) GPR_idx += (GPR_idx % 2);
Dale Johannesen	eaea88c	2008-03-07 20:27:40 +0000	[diff] [blame]	1899	if (Size==1 \|\| Size==2) {
				1900	// Very small objects are passed right-justified.
				1901	// Everything else is passed left-justified.
				1902	MVT::ValueType VT = (Size==1) ? MVT::i8 : MVT::i16;
				1903	if (GPR_idx != NumGPRs) {
				1904	SDOperand Load = DAG.getExtLoad(ISD::EXTLOAD, PtrVT, Chain, Arg,
				1905	NULL, 0, VT);
				1906	MemOpChains.push_back(Load.getValue(1));
				1907	RegsToPass.push_back(std::make_pair(GPR[GPR_idx++], Load));
				1908	if (isMachoABI)
				1909	ArgOffset += PtrByteSize;
				1910	} else {
				1911	SDOperand Const = DAG.getConstant(4 - Size, PtrOff.getValueType());
				1912	SDOperand AddPtr = DAG.getNode(ISD::ADD, PtrVT, PtrOff, Const);
				1913	SDOperand MemcpyCall = CreateCopyOfByValArgument(Arg, AddPtr,
				1914	CallSeqStart.Val->getOperand(0),
				1915	Flags, DAG, Size);
				1916	// This must go outside the CALLSEQ_START..END.
				1917	SDOperand NewCallSeqStart = DAG.getCALLSEQ_START(MemcpyCall,
				1918	CallSeqStart.Val->getOperand(1));
				1919	DAG.ReplaceAllUsesWith(CallSeqStart.Val, NewCallSeqStart.Val);
				1920	Chain = CallSeqStart = NewCallSeqStart;
				1921	ArgOffset += PtrByteSize;
				1922	}
				1923	continue;
				1924	}
Dale Johannesen	bfadf4b	2008-03-17 02:13:43 +0000	[diff] [blame^]	1925	// Copy entire object into memory. There are cases where gcc-generated
				1926	// code assumes it is there, even if it could be put entirely into
				1927	// registers. (This is not what the doc says.)
				1928	SDOperand MemcpyCall = CreateCopyOfByValArgument(Arg, PtrOff,
				1929	CallSeqStart.Val->getOperand(0),
				1930	Flags, DAG, Size);
				1931	// This must go outside the CALLSEQ_START..END.
				1932	SDOperand NewCallSeqStart = DAG.getCALLSEQ_START(MemcpyCall,
				1933	CallSeqStart.Val->getOperand(1));
				1934	DAG.ReplaceAllUsesWith(CallSeqStart.Val, NewCallSeqStart.Val);
				1935	Chain = CallSeqStart = NewCallSeqStart;
				1936	// And copy the pieces of it that fit into registers.
Dale Johannesen	8be83a7	2008-03-04 23:17:14 +0000	[diff] [blame]	1937	for (unsigned j=0; j<Size; j+=PtrByteSize) {
				1938	SDOperand Const = DAG.getConstant(j, PtrOff.getValueType());
				1939	SDOperand AddArg = DAG.getNode(ISD::ADD, PtrVT, Arg, Const);
				1940	if (GPR_idx != NumGPRs) {
				1941	SDOperand Load = DAG.getLoad(PtrVT, Chain, AddArg, NULL, 0);
Dale Johannesen	7a7aa10	2008-03-05 23:31:27 +0000	[diff] [blame]	1942	MemOpChains.push_back(Load.getValue(1));
Dale Johannesen	8be83a7	2008-03-04 23:17:14 +0000	[diff] [blame]	1943	RegsToPass.push_back(std::make_pair(GPR[GPR_idx++], Load));
				1944	if (isMachoABI)
				1945	ArgOffset += PtrByteSize;
				1946	} else {
Dale Johannesen	bfadf4b	2008-03-17 02:13:43 +0000	[diff] [blame^]	1947	ArgOffset += ((Size - j + PtrByteSize-1)/PtrByteSize)*PtrByteSize;
Dale Johannesen	eaea88c	2008-03-07 20:27:40 +0000	[diff] [blame]	1948	break;
Dale Johannesen	8be83a7	2008-03-04 23:17:14 +0000	[diff] [blame]	1949	}
				1950	}
				1951	continue;
				1952	}
				1953
Dan Gohman	f17a25c	2007-07-18 16:29:46 +0000	[diff] [blame]	1954	switch (Arg.getValueType()) {
				1955	default: assert(0 && "Unexpected ValueType for argument!");
				1956	case MVT::i32:
				1957	case MVT::i64:
				1958	// Double word align in ELF
				1959	if (isELF32_ABI && Expand) GPR_idx += (GPR_idx % 2);
				1960	if (GPR_idx != NumGPRs) {
				1961	RegsToPass.push_back(std::make_pair(GPR[GPR_idx++], Arg));
				1962	} else {
				1963	MemOpChains.push_back(DAG.getStore(Chain, Arg, PtrOff, NULL, 0));
				1964	inMem = true;
				1965	}
				1966	if (inMem \|\| isMachoABI) {
				1967	// Stack align in ELF
				1968	if (isELF32_ABI && Expand)
				1969	ArgOffset += ((ArgOffset/4) % 2) * PtrByteSize;
				1970
				1971	ArgOffset += PtrByteSize;
				1972	}
				1973	break;
				1974	case MVT::f32:
				1975	case MVT::f64:
Dan Gohman	f17a25c	2007-07-18 16:29:46 +0000	[diff] [blame]	1976	if (FPR_idx != NumFPRs) {
				1977	RegsToPass.push_back(std::make_pair(FPR[FPR_idx++], Arg));
				1978
				1979	if (isVarArg) {
				1980	SDOperand Store = DAG.getStore(Chain, Arg, PtrOff, NULL, 0);
				1981	MemOpChains.push_back(Store);
				1982
				1983	// Float varargs are always shadowed in available integer registers
				1984	if (GPR_idx != NumGPRs) {
				1985	SDOperand Load = DAG.getLoad(PtrVT, Store, PtrOff, NULL, 0);
				1986	MemOpChains.push_back(Load.getValue(1));
				1987	if (isMachoABI) RegsToPass.push_back(std::make_pair(GPR[GPR_idx++],
				1988	Load));
				1989	}
				1990	if (GPR_idx != NumGPRs && Arg.getValueType() == MVT::f64 && !isPPC64){
				1991	SDOperand ConstFour = DAG.getConstant(4, PtrOff.getValueType());
				1992	PtrOff = DAG.getNode(ISD::ADD, PtrVT, PtrOff, ConstFour);
				1993	SDOperand Load = DAG.getLoad(PtrVT, Store, PtrOff, NULL, 0);
				1994	MemOpChains.push_back(Load.getValue(1));
				1995	if (isMachoABI) RegsToPass.push_back(std::make_pair(GPR[GPR_idx++],
				1996	Load));
				1997	}
				1998	} else {
				1999	// If we have any FPRs remaining, we may also have GPRs remaining.
				2000	// Args passed in FPRs consume either 1 (f32) or 2 (f64) available
				2001	// GPRs.
				2002	if (isMachoABI) {
				2003	if (GPR_idx != NumGPRs)
				2004	++GPR_idx;
				2005	if (GPR_idx != NumGPRs && Arg.getValueType() == MVT::f64 &&
				2006	!isPPC64) // PPC64 has 64-bit GPR's obviously :)
				2007	++GPR_idx;
				2008	}
				2009	}
				2010	} else {
				2011	MemOpChains.push_back(DAG.getStore(Chain, Arg, PtrOff, NULL, 0));
				2012	inMem = true;
				2013	}
				2014	if (inMem \|\| isMachoABI) {
				2015	// Stack align in ELF
				2016	if (isELF32_ABI && Expand)
				2017	ArgOffset += ((ArgOffset/4) % 2) * PtrByteSize;
				2018	if (isPPC64)
				2019	ArgOffset += 8;
				2020	else
				2021	ArgOffset += Arg.getValueType() == MVT::f32 ? 4 : 8;
				2022	}
				2023	break;
				2024	case MVT::v4f32:
				2025	case MVT::v4i32:
				2026	case MVT::v8i16:
				2027	case MVT::v16i8:
Dale Johannesen	946b9cc	2008-03-12 00:22:17 +0000	[diff] [blame]	2028	if (isVarArg) {
				2029	// These go aligned on the stack, or in the corresponding R registers
				2030	// when within range. The Darwin PPC ABI doc claims they also go in
				2031	// V registers; in fact gcc does this only for arguments that are
				2032	// prototyped, not for those that match the ... We do it for all
				2033	// arguments, seems to work.
				2034	while (ArgOffset % 16 !=0) {
				2035	ArgOffset += PtrByteSize;
				2036	if (GPR_idx != NumGPRs)
				2037	GPR_idx++;
				2038	}
				2039	// We could elide this store in the case where the object fits
				2040	// entirely in R registers. Maybe later.
				2041	PtrOff = DAG.getNode(ISD::ADD, PtrVT, StackPtr,
				2042	DAG.getConstant(ArgOffset, PtrVT));
				2043	SDOperand Store = DAG.getStore(Chain, Arg, PtrOff, NULL, 0);
				2044	MemOpChains.push_back(Store);
				2045	if (VR_idx != NumVRs) {
				2046	SDOperand Load = DAG.getLoad(MVT::v4f32, Store, PtrOff, NULL, 0);
				2047	MemOpChains.push_back(Load.getValue(1));
				2048	RegsToPass.push_back(std::make_pair(VR[VR_idx++], Load));
				2049	}
				2050	ArgOffset += 16;
				2051	for (unsigned i=0; i<16; i+=PtrByteSize) {
				2052	if (GPR_idx == NumGPRs)
				2053	break;
				2054	SDOperand Ix = DAG.getNode(ISD::ADD, PtrVT, PtrOff,
				2055	DAG.getConstant(i, PtrVT));
				2056	SDOperand Load = DAG.getLoad(PtrVT, Store, Ix, NULL, 0);
				2057	MemOpChains.push_back(Load.getValue(1));
				2058	RegsToPass.push_back(std::make_pair(GPR[GPR_idx++], Load));
				2059	}
				2060	break;
				2061	}
Dale Johannesen	f6a394b	2008-03-14 17:41:26 +0000	[diff] [blame]	2062	// Non-varargs Altivec params generally go in registers, but have
				2063	// stack space allocated at the end.
				2064	if (VR_idx != NumVRs) {
				2065	// Doesn't have GPR space allocated.
				2066	RegsToPass.push_back(std::make_pair(VR[VR_idx++], Arg));
				2067	} else if (nAltivecParamsAtEnd==0) {
				2068	// We are emitting Altivec params in order.
Dale Johannesen	946b9cc	2008-03-12 00:22:17 +0000	[diff] [blame]	2069	PtrOff = DAG.getNode(ISD::ADD, PtrVT, StackPtr,
				2070	DAG.getConstant(ArgOffset, PtrVT));
				2071	SDOperand Store = DAG.getStore(Chain, Arg, PtrOff, NULL, 0);
				2072	MemOpChains.push_back(Store);
				2073	ArgOffset += 16;
Dale Johannesen	946b9cc	2008-03-12 00:22:17 +0000	[diff] [blame]	2074	}
Dan Gohman	f17a25c	2007-07-18 16:29:46 +0000	[diff] [blame]	2075	break;
				2076	}
				2077	}
Dale Johannesen	f6a394b	2008-03-14 17:41:26 +0000	[diff] [blame]	2078	// If all Altivec parameters fit in registers, as they usually do,
				2079	// they get stack space following the non-Altivec parameters. We
				2080	// don't track this here because nobody below needs it.
				2081	// If there are more Altivec parameters than fit in registers emit
				2082	// the stores here.
				2083	if (!isVarArg && nAltivecParamsAtEnd > NumVRs) {
				2084	unsigned j = 0;
				2085	// Offset is aligned; skip 1st 12 params which go in V registers.
				2086	ArgOffset = ((ArgOffset+15)/16)*16;
				2087	ArgOffset += 12*16;
				2088	for (unsigned i = 0; i != NumOps; ++i) {
				2089	SDOperand Arg = Op.getOperand(5+2*i);
				2090	MVT::ValueType ArgType = Arg.getValueType();
				2091	if (ArgType==MVT::v4f32 \|\| ArgType==MVT::v4i32 \|\|
				2092	ArgType==MVT::v8i16 \|\| ArgType==MVT::v16i8) {
				2093	if (++j > NumVRs) {
				2094	SDOperand PtrOff = DAG.getNode(ISD::ADD, PtrVT, StackPtr,
				2095	DAG.getConstant(ArgOffset, PtrVT));
				2096	SDOperand Store = DAG.getStore(Chain, Arg, PtrOff, NULL, 0);
				2097	MemOpChains.push_back(Store);
				2098	ArgOffset += 16;
				2099	}
				2100	}
				2101	}
				2102	}
				2103
Dan Gohman	f17a25c	2007-07-18 16:29:46 +0000	[diff] [blame]	2104	if (!MemOpChains.empty())
				2105	Chain = DAG.getNode(ISD::TokenFactor, MVT::Other,
				2106	&MemOpChains[0], MemOpChains.size());
				2107
				2108	// Build a sequence of copy-to-reg nodes chained together with token chain
				2109	// and flag operands which copy the outgoing args into the appropriate regs.
				2110	SDOperand InFlag;
				2111	for (unsigned i = 0, e = RegsToPass.size(); i != e; ++i) {
				2112	Chain = DAG.getCopyToReg(Chain, RegsToPass[i].first, RegsToPass[i].second,
				2113	InFlag);
				2114	InFlag = Chain.getValue(1);
				2115	}
				2116
				2117	// With the ELF 32 ABI, set CR6 to true if this is a vararg call.
				2118	if (isVarArg && isELF32_ABI) {
Nicolas Geoffray	d01feb2	2008-03-10 14:12:10 +0000	[diff] [blame]	2119	SDOperand SetCR(DAG.getTargetNode(PPC::CRSET, MVT::i32), 0);
				2120	Chain = DAG.getCopyToReg(Chain, PPC::CR1EQ, SetCR, InFlag);
Dan Gohman	f17a25c	2007-07-18 16:29:46 +0000	[diff] [blame]	2121	InFlag = Chain.getValue(1);
				2122	}
				2123
				2124	std::vector<MVT::ValueType> NodeTys;
				2125	NodeTys.push_back(MVT::Other); // Returns a chain
				2126	NodeTys.push_back(MVT::Flag); // Returns a flag for retval copy to use.
				2127
				2128	SmallVector<SDOperand, 8> Ops;
				2129	unsigned CallOpc = isMachoABI? PPCISD::CALL_Macho : PPCISD::CALL_ELF;
				2130
				2131	// If the callee is a GlobalAddress/ExternalSymbol node (quite common, every
				2132	// direct call is) turn it into a TargetGlobalAddress/TargetExternalSymbol
				2133	// node so that legalize doesn't hack it.
Nicolas Geoffray	455a2e0	2007-12-21 12:22:29 +0000	[diff] [blame]	2134	if (GlobalAddressSDNode *G = dyn_cast<GlobalAddressSDNode>(Callee))
				2135	Callee = DAG.getTargetGlobalAddress(G->getGlobal(), Callee.getValueType());
				2136	else if (ExternalSymbolSDNode *S = dyn_cast<ExternalSymbolSDNode>(Callee))
Dan Gohman	f17a25c	2007-07-18 16:29:46 +0000	[diff] [blame]	2137	Callee = DAG.getTargetExternalSymbol(S->getSymbol(), Callee.getValueType());
				2138	else if (SDNode *Dest = isBLACompatibleAddress(Callee, DAG))
				2139	// If this is an absolute destination address, use the munged value.
				2140	Callee = SDOperand(Dest, 0);
				2141	else {
				2142	// Otherwise, this is an indirect call. We have to use a MTCTR/BCTRL pair
				2143	// to do the call, we can't use PPCISD::CALL.
				2144	SDOperand MTCTROps[] = {Chain, Callee, InFlag};
				2145	Chain = DAG.getNode(PPCISD::MTCTR, NodeTys, MTCTROps, 2+(InFlag.Val!=0));
				2146	InFlag = Chain.getValue(1);
				2147
Chris Lattner	6eae8c6	2008-03-09 20:49:33 +0000	[diff] [blame]	2148	// Copy the callee address into R12/X12 on darwin.
Dan Gohman	f17a25c	2007-07-18 16:29:46 +0000	[diff] [blame]	2149	if (isMachoABI) {
Chris Lattner	6eae8c6	2008-03-09 20:49:33 +0000	[diff] [blame]	2150	unsigned Reg = Callee.getValueType() == MVT::i32 ? PPC::R12 : PPC::X12;
				2151	Chain = DAG.getCopyToReg(Chain, Reg, Callee, InFlag);
Dan Gohman	f17a25c	2007-07-18 16:29:46 +0000	[diff] [blame]	2152	InFlag = Chain.getValue(1);
				2153	}
				2154
				2155	NodeTys.clear();
				2156	NodeTys.push_back(MVT::Other);
				2157	NodeTys.push_back(MVT::Flag);
				2158	Ops.push_back(Chain);
				2159	CallOpc = isMachoABI ? PPCISD::BCTRL_Macho : PPCISD::BCTRL_ELF;
				2160	Callee.Val = 0;
				2161	}
				2162
				2163	// If this is a direct call, pass the chain and the callee.
				2164	if (Callee.Val) {
				2165	Ops.push_back(Chain);
				2166	Ops.push_back(Callee);
				2167	}
				2168
				2169	// Add argument registers to the end of the list so that they are known live
				2170	// into the call.
				2171	for (unsigned i = 0, e = RegsToPass.size(); i != e; ++i)
				2172	Ops.push_back(DAG.getRegister(RegsToPass[i].first,
				2173	RegsToPass[i].second.getValueType()));
				2174
				2175	if (InFlag.Val)
				2176	Ops.push_back(InFlag);
				2177	Chain = DAG.getNode(CallOpc, NodeTys, &Ops[0], Ops.size());
				2178	InFlag = Chain.getValue(1);
				2179
Bill Wendling	22f8deb	2007-11-13 00:44:25 +0000	[diff] [blame]	2180	Chain = DAG.getCALLSEQ_END(Chain,
				2181	DAG.getConstant(NumBytes, PtrVT),
				2182	DAG.getConstant(0, PtrVT),
				2183	InFlag);
				2184	if (Op.Val->getValueType(0) != MVT::Other)
				2185	InFlag = Chain.getValue(1);
				2186
Dale Johannesen	bfadf4b	2008-03-17 02:13:43 +0000	[diff] [blame^]	2187	SDOperand ResultVals[9];
Dan Gohman	f17a25c	2007-07-18 16:29:46 +0000	[diff] [blame]	2188	unsigned NumResults = 0;
				2189	NodeTys.clear();
				2190
				2191	// If the call has results, copy the values out of the ret val registers.
				2192	switch (Op.Val->getValueType(0)) {
				2193	default: assert(0 && "Unexpected ret value!");
				2194	case MVT::Other: break;
				2195	case MVT::i32:
Dale Johannesen	bfadf4b	2008-03-17 02:13:43 +0000	[diff] [blame^]	2196	// There are 8 result regs for Complex double, and 4 for Complex long long.
				2197	if (Op.Val->getNumValues()>=8 && Op.Val->getValueType(7) == MVT::i32) {
				2198	Chain = DAG.getCopyFromReg(Chain, PPC::R3, MVT::i32, InFlag).getValue(1);
				2199	ResultVals[0] = Chain.getValue(0);
				2200	Chain = DAG.getCopyFromReg(Chain, PPC::R4, MVT::i32,
				2201	Chain.getValue(2)).getValue(1);
				2202	ResultVals[1] = Chain.getValue(0);
				2203	Chain = DAG.getCopyFromReg(Chain, PPC::R5, MVT::i32,
				2204	Chain.getValue(2)).getValue(1);
				2205	ResultVals[2] = Chain.getValue(0);
				2206	Chain = DAG.getCopyFromReg(Chain, PPC::R6, MVT::i32,
				2207	Chain.getValue(2)).getValue(1);
				2208	ResultVals[3] = Chain.getValue(0);
				2209	Chain = DAG.getCopyFromReg(Chain, PPC::R7, MVT::i32,
				2210	Chain.getValue(2)).getValue(1);
				2211	ResultVals[4] = Chain.getValue(0);
				2212	Chain = DAG.getCopyFromReg(Chain, PPC::R8, MVT::i32,
				2213	Chain.getValue(2)).getValue(1);
				2214	ResultVals[5] = Chain.getValue(0);
				2215	Chain = DAG.getCopyFromReg(Chain, PPC::R9, MVT::i32,
				2216	Chain.getValue(2)).getValue(1);
				2217	ResultVals[6] = Chain.getValue(0);
				2218	Chain = DAG.getCopyFromReg(Chain, PPC::R10, MVT::i32,
				2219	Chain.getValue(2)).getValue(1);
				2220	ResultVals[7] = Chain.getValue(0);
				2221	NumResults = 8;
				2222	NodeTys.push_back(MVT::i32);
				2223	NodeTys.push_back(MVT::i32);
				2224	NodeTys.push_back(MVT::i32);
				2225	NodeTys.push_back(MVT::i32);
				2226	NodeTys.push_back(MVT::i32);
				2227	NodeTys.push_back(MVT::i32);
				2228	NodeTys.push_back(MVT::i32);
				2229	} else if (Op.Val->getNumValues()>=4 &&
				2230	Op.Val->getValueType(3) == MVT::i32) {
				2231	Chain = DAG.getCopyFromReg(Chain, PPC::R3, MVT::i32, InFlag).getValue(1);
				2232	ResultVals[0] = Chain.getValue(0);
				2233	Chain = DAG.getCopyFromReg(Chain, PPC::R4, MVT::i32,
				2234	Chain.getValue(2)).getValue(1);
				2235	ResultVals[1] = Chain.getValue(0);
				2236	Chain = DAG.getCopyFromReg(Chain, PPC::R5, MVT::i32,
				2237	Chain.getValue(2)).getValue(1);
				2238	ResultVals[2] = Chain.getValue(0);
				2239	Chain = DAG.getCopyFromReg(Chain, PPC::R6, MVT::i32,
				2240	Chain.getValue(2)).getValue(1);
				2241	ResultVals[3] = Chain.getValue(0);
				2242	NumResults = 4;
				2243	NodeTys.push_back(MVT::i32);
				2244	NodeTys.push_back(MVT::i32);
				2245	NodeTys.push_back(MVT::i32);
				2246	} else if (Op.Val->getValueType(1) == MVT::i32) {
Dan Gohman	f17a25c	2007-07-18 16:29:46 +0000	[diff] [blame]	2247	Chain = DAG.getCopyFromReg(Chain, PPC::R3, MVT::i32, InFlag).getValue(1);
				2248	ResultVals[0] = Chain.getValue(0);
				2249	Chain = DAG.getCopyFromReg(Chain, PPC::R4, MVT::i32,
				2250	Chain.getValue(2)).getValue(1);
				2251	ResultVals[1] = Chain.getValue(0);
				2252	NumResults = 2;
				2253	NodeTys.push_back(MVT::i32);
				2254	} else {
				2255	Chain = DAG.getCopyFromReg(Chain, PPC::R3, MVT::i32, InFlag).getValue(1);
				2256	ResultVals[0] = Chain.getValue(0);
				2257	NumResults = 1;
				2258	}
				2259	NodeTys.push_back(MVT::i32);
				2260	break;
				2261	case MVT::i64:
Dan Gohman	fe65bda	2008-03-08 00:19:12 +0000	[diff] [blame]	2262	if (Op.Val->getValueType(1) == MVT::i64) {
				2263	Chain = DAG.getCopyFromReg(Chain, PPC::X3, MVT::i64, InFlag).getValue(1);
				2264	ResultVals[0] = Chain.getValue(0);
				2265	Chain = DAG.getCopyFromReg(Chain, PPC::X4, MVT::i64,
				2266	Chain.getValue(2)).getValue(1);
				2267	ResultVals[1] = Chain.getValue(0);
				2268	NumResults = 2;
				2269	NodeTys.push_back(MVT::i64);
				2270	} else {
				2271	Chain = DAG.getCopyFromReg(Chain, PPC::X3, MVT::i64, InFlag).getValue(1);
				2272	ResultVals[0] = Chain.getValue(0);
				2273	NumResults = 1;
				2274	}
Dan Gohman	f17a25c	2007-07-18 16:29:46 +0000	[diff] [blame]	2275	NodeTys.push_back(MVT::i64);
				2276	break;
Dan Gohman	f17a25c	2007-07-18 16:29:46 +0000	[diff] [blame]	2277	case MVT::f64:
Dale Johannesen	ac77b27	2007-10-05 20:04:43 +0000	[diff] [blame]	2278	if (Op.Val->getValueType(1) == MVT::f64) {
				2279	Chain = DAG.getCopyFromReg(Chain, PPC::F1, MVT::f64, InFlag).getValue(1);
				2280	ResultVals[0] = Chain.getValue(0);
				2281	Chain = DAG.getCopyFromReg(Chain, PPC::F2, MVT::f64,
				2282	Chain.getValue(2)).getValue(1);
				2283	ResultVals[1] = Chain.getValue(0);
				2284	NumResults = 2;
				2285	NodeTys.push_back(MVT::f64);
				2286	NodeTys.push_back(MVT::f64);
				2287	break;
				2288	}
				2289	// else fall through
				2290	case MVT::f32:
Dan Gohman	f17a25c	2007-07-18 16:29:46 +0000	[diff] [blame]	2291	Chain = DAG.getCopyFromReg(Chain, PPC::F1, Op.Val->getValueType(0),
				2292	InFlag).getValue(1);
				2293	ResultVals[0] = Chain.getValue(0);
				2294	NumResults = 1;
				2295	NodeTys.push_back(Op.Val->getValueType(0));
				2296	break;
				2297	case MVT::v4f32:
				2298	case MVT::v4i32:
				2299	case MVT::v8i16:
				2300	case MVT::v16i8:
				2301	Chain = DAG.getCopyFromReg(Chain, PPC::V2, Op.Val->getValueType(0),
				2302	InFlag).getValue(1);
				2303	ResultVals[0] = Chain.getValue(0);
				2304	NumResults = 1;
				2305	NodeTys.push_back(Op.Val->getValueType(0));
				2306	break;
				2307	}
				2308
Dan Gohman	f17a25c	2007-07-18 16:29:46 +0000	[diff] [blame]	2309	NodeTys.push_back(MVT::Other);
				2310
				2311	// If the function returns void, just return the chain.
				2312	if (NumResults == 0)
				2313	return Chain;
				2314
				2315	// Otherwise, merge everything together with a MERGE_VALUES node.
				2316	ResultVals[NumResults++] = Chain;
				2317	SDOperand Res = DAG.getNode(ISD::MERGE_VALUES, NodeTys,
				2318	ResultVals, NumResults);
				2319	return Res.getValue(Op.ResNo);
				2320	}
				2321
Dale Johannesen	8be83a7	2008-03-04 23:17:14 +0000	[diff] [blame]	2322	SDOperand PPCTargetLowering::LowerRET(SDOperand Op, SelectionDAG &DAG,
				2323	TargetMachine &TM) {
Dan Gohman	f17a25c	2007-07-18 16:29:46 +0000	[diff] [blame]	2324	SmallVector<CCValAssign, 16> RVLocs;
				2325	unsigned CC = DAG.getMachineFunction().getFunction()->getCallingConv();
				2326	bool isVarArg = DAG.getMachineFunction().getFunction()->isVarArg();
				2327	CCState CCInfo(CC, isVarArg, TM, RVLocs);
				2328	CCInfo.AnalyzeReturn(Op.Val, RetCC_PPC);
				2329
				2330	// If this is the first return lowered for this function, add the regs to the
				2331	// liveout set for the function.
Chris Lattner	1b98919	2007-12-31 04:13:23 +0000	[diff] [blame]	2332	if (DAG.getMachineFunction().getRegInfo().liveout_empty()) {
Dan Gohman	f17a25c	2007-07-18 16:29:46 +0000	[diff] [blame]	2333	for (unsigned i = 0; i != RVLocs.size(); ++i)
Chris Lattner	1b98919	2007-12-31 04:13:23 +0000	[diff] [blame]	2334	DAG.getMachineFunction().getRegInfo().addLiveOut(RVLocs[i].getLocReg());
Dan Gohman	f17a25c	2007-07-18 16:29:46 +0000	[diff] [blame]	2335	}
				2336
				2337	SDOperand Chain = Op.getOperand(0);
				2338	SDOperand Flag;
				2339
				2340	// Copy the result values into the output registers.
				2341	for (unsigned i = 0; i != RVLocs.size(); ++i) {
				2342	CCValAssign &VA = RVLocs[i];
				2343	assert(VA.isRegLoc() && "Can only return in registers!");
				2344	Chain = DAG.getCopyToReg(Chain, VA.getLocReg(), Op.getOperand(i*2+1), Flag);
				2345	Flag = Chain.getValue(1);
				2346	}
				2347
				2348	if (Flag.Val)
				2349	return DAG.getNode(PPCISD::RET_FLAG, MVT::Other, Chain, Flag);
				2350	else
				2351	return DAG.getNode(PPCISD::RET_FLAG, MVT::Other, Chain);
				2352	}
				2353
Dale Johannesen	8be83a7	2008-03-04 23:17:14 +0000	[diff] [blame]	2354	SDOperand PPCTargetLowering::LowerSTACKRESTORE(SDOperand Op, SelectionDAG &DAG,
Dan Gohman	f17a25c	2007-07-18 16:29:46 +0000	[diff] [blame]	2355	const PPCSubtarget &Subtarget) {
				2356	// When we pop the dynamic allocation we need to restore the SP link.
				2357
				2358	// Get the corect type for pointers.
				2359	MVT::ValueType PtrVT = DAG.getTargetLoweringInfo().getPointerTy();
				2360
				2361	// Construct the stack pointer operand.
				2362	bool IsPPC64 = Subtarget.isPPC64();
				2363	unsigned SP = IsPPC64 ? PPC::X1 : PPC::R1;
				2364	SDOperand StackPtr = DAG.getRegister(SP, PtrVT);
				2365
				2366	// Get the operands for the STACKRESTORE.
				2367	SDOperand Chain = Op.getOperand(0);
				2368	SDOperand SaveSP = Op.getOperand(1);
				2369
				2370	// Load the old link SP.
				2371	SDOperand LoadLinkSP = DAG.getLoad(PtrVT, Chain, StackPtr, NULL, 0);
				2372
				2373	// Restore the stack pointer.
				2374	Chain = DAG.getCopyToReg(LoadLinkSP.getValue(1), SP, SaveSP);
				2375
				2376	// Store the old link SP.
				2377	return DAG.getStore(Chain, LoadLinkSP, StackPtr, NULL, 0);
				2378	}
				2379
Dale Johannesen	8be83a7	2008-03-04 23:17:14 +0000	[diff] [blame]	2380	SDOperand PPCTargetLowering::LowerDYNAMIC_STACKALLOC(SDOperand Op,
				2381	SelectionDAG &DAG,
Dan Gohman	f17a25c	2007-07-18 16:29:46 +0000	[diff] [blame]	2382	const PPCSubtarget &Subtarget) {
				2383	MachineFunction &MF = DAG.getMachineFunction();
				2384	bool IsPPC64 = Subtarget.isPPC64();
				2385	bool isMachoABI = Subtarget.isMachoABI();
				2386
				2387	// Get current frame pointer save index. The users of this index will be
				2388	// primarily DYNALLOC instructions.
				2389	PPCFunctionInfo *FI = MF.getInfo<PPCFunctionInfo>();
				2390	int FPSI = FI->getFramePointerSaveIndex();
				2391
				2392	// If the frame pointer save index hasn't been defined yet.
				2393	if (!FPSI) {
				2394	// Find out what the fix offset of the frame pointer save area.
				2395	int FPOffset = PPCFrameInfo::getFramePointerSaveOffset(IsPPC64, isMachoABI);
				2396
				2397	// Allocate the frame index for frame pointer save area.
				2398	FPSI = MF.getFrameInfo()->CreateFixedObject(IsPPC64? 8 : 4, FPOffset);
				2399	// Save the result.
				2400	FI->setFramePointerSaveIndex(FPSI);
				2401	}
				2402
				2403	// Get the inputs.
				2404	SDOperand Chain = Op.getOperand(0);
				2405	SDOperand Size = Op.getOperand(1);
				2406
				2407	// Get the corect type for pointers.
				2408	MVT::ValueType PtrVT = DAG.getTargetLoweringInfo().getPointerTy();
				2409	// Negate the size.
				2410	SDOperand NegSize = DAG.getNode(ISD::SUB, PtrVT,
				2411	DAG.getConstant(0, PtrVT), Size);
				2412	// Construct a node for the frame pointer save index.
				2413	SDOperand FPSIdx = DAG.getFrameIndex(FPSI, PtrVT);
				2414	// Build a DYNALLOC node.
				2415	SDOperand Ops[3] = { Chain, NegSize, FPSIdx };
				2416	SDVTList VTs = DAG.getVTList(PtrVT, MVT::Other);
				2417	return DAG.getNode(PPCISD::DYNALLOC, VTs, Ops, 3);
				2418	}
				2419
				2420
				2421	/// LowerSELECT_CC - Lower floating point select_cc's into fsel instruction when
				2422	/// possible.
Dale Johannesen	8be83a7	2008-03-04 23:17:14 +0000	[diff] [blame]	2423	SDOperand PPCTargetLowering::LowerSELECT_CC(SDOperand Op, SelectionDAG &DAG) {
Dan Gohman	f17a25c	2007-07-18 16:29:46 +0000	[diff] [blame]	2424	// Not FP? Not a fsel.
				2425	if (!MVT::isFloatingPoint(Op.getOperand(0).getValueType()) \|\|
				2426	!MVT::isFloatingPoint(Op.getOperand(2).getValueType()))
				2427	return SDOperand();
				2428
				2429	ISD::CondCode CC = cast<CondCodeSDNode>(Op.getOperand(4))->get();
				2430
				2431	// Cannot handle SETEQ/SETNE.
				2432	if (CC == ISD::SETEQ \|\| CC == ISD::SETNE) return SDOperand();
				2433
				2434	MVT::ValueType ResVT = Op.getValueType();
				2435	MVT::ValueType CmpVT = Op.getOperand(0).getValueType();
				2436	SDOperand LHS = Op.getOperand(0), RHS = Op.getOperand(1);
				2437	SDOperand TV = Op.getOperand(2), FV = Op.getOperand(3);
				2438
				2439	// If the RHS of the comparison is a 0.0, we don't need to do the
				2440	// subtraction at all.
				2441	if (isFloatingPointZero(RHS))
				2442	switch (CC) {
				2443	default: break; // SETUO etc aren't handled by fsel.
				2444	case ISD::SETULT:
				2445	case ISD::SETOLT:
				2446	case ISD::SETLT:
				2447	std::swap(TV, FV); // fsel is natively setge, swap operands for setlt
				2448	case ISD::SETUGE:
				2449	case ISD::SETOGE:
				2450	case ISD::SETGE:
				2451	if (LHS.getValueType() == MVT::f32) // Comparison is always 64-bits
				2452	LHS = DAG.getNode(ISD::FP_EXTEND, MVT::f64, LHS);
				2453	return DAG.getNode(PPCISD::FSEL, ResVT, LHS, TV, FV);
				2454	case ISD::SETUGT:
				2455	case ISD::SETOGT:
				2456	case ISD::SETGT:
				2457	std::swap(TV, FV); // fsel is natively setge, swap operands for setlt
				2458	case ISD::SETULE:
				2459	case ISD::SETOLE:
				2460	case ISD::SETLE:
				2461	if (LHS.getValueType() == MVT::f32) // Comparison is always 64-bits
				2462	LHS = DAG.getNode(ISD::FP_EXTEND, MVT::f64, LHS);
				2463	return DAG.getNode(PPCISD::FSEL, ResVT,
				2464	DAG.getNode(ISD::FNEG, MVT::f64, LHS), TV, FV);
				2465	}
				2466
Chris Lattner	a216bee	2007-10-15 20:14:52 +0000	[diff] [blame]	2467	SDOperand Cmp;
Dan Gohman	f17a25c	2007-07-18 16:29:46 +0000	[diff] [blame]	2468	switch (CC) {
				2469	default: break; // SETUO etc aren't handled by fsel.
				2470	case ISD::SETULT:
				2471	case ISD::SETOLT:
				2472	case ISD::SETLT:
				2473	Cmp = DAG.getNode(ISD::FSUB, CmpVT, LHS, RHS);
				2474	if (Cmp.getValueType() == MVT::f32) // Comparison is always 64-bits
				2475	Cmp = DAG.getNode(ISD::FP_EXTEND, MVT::f64, Cmp);
				2476	return DAG.getNode(PPCISD::FSEL, ResVT, Cmp, FV, TV);
				2477	case ISD::SETUGE:
				2478	case ISD::SETOGE:
				2479	case ISD::SETGE:
				2480	Cmp = DAG.getNode(ISD::FSUB, CmpVT, LHS, RHS);
				2481	if (Cmp.getValueType() == MVT::f32) // Comparison is always 64-bits
				2482	Cmp = DAG.getNode(ISD::FP_EXTEND, MVT::f64, Cmp);
				2483	return DAG.getNode(PPCISD::FSEL, ResVT, Cmp, TV, FV);
				2484	case ISD::SETUGT:
				2485	case ISD::SETOGT:
				2486	case ISD::SETGT:
				2487	Cmp = DAG.getNode(ISD::FSUB, CmpVT, RHS, LHS);
				2488	if (Cmp.getValueType() == MVT::f32) // Comparison is always 64-bits
				2489	Cmp = DAG.getNode(ISD::FP_EXTEND, MVT::f64, Cmp);
				2490	return DAG.getNode(PPCISD::FSEL, ResVT, Cmp, FV, TV);
				2491	case ISD::SETULE:
				2492	case ISD::SETOLE:
				2493	case ISD::SETLE:
				2494	Cmp = DAG.getNode(ISD::FSUB, CmpVT, RHS, LHS);
				2495	if (Cmp.getValueType() == MVT::f32) // Comparison is always 64-bits
				2496	Cmp = DAG.getNode(ISD::FP_EXTEND, MVT::f64, Cmp);
				2497	return DAG.getNode(PPCISD::FSEL, ResVT, Cmp, TV, FV);
				2498	}
				2499	return SDOperand();
				2500	}
				2501
Chris Lattner	2877109	2007-11-28 18:44:47 +0000	[diff] [blame]	2502	// FIXME: Split this code up when LegalizeDAGTypes lands.
Dale Johannesen	8be83a7	2008-03-04 23:17:14 +0000	[diff] [blame]	2503	SDOperand PPCTargetLowering::LowerFP_TO_SINT(SDOperand Op, SelectionDAG &DAG) {
Dan Gohman	f17a25c	2007-07-18 16:29:46 +0000	[diff] [blame]	2504	assert(MVT::isFloatingPoint(Op.getOperand(0).getValueType()));
				2505	SDOperand Src = Op.getOperand(0);
				2506	if (Src.getValueType() == MVT::f32)
				2507	Src = DAG.getNode(ISD::FP_EXTEND, MVT::f64, Src);
				2508
				2509	SDOperand Tmp;
				2510	switch (Op.getValueType()) {
				2511	default: assert(0 && "Unhandled FP_TO_SINT type in custom expander!");
				2512	case MVT::i32:
				2513	Tmp = DAG.getNode(PPCISD::FCTIWZ, MVT::f64, Src);
				2514	break;
				2515	case MVT::i64:
				2516	Tmp = DAG.getNode(PPCISD::FCTIDZ, MVT::f64, Src);
				2517	break;
				2518	}
				2519
				2520	// Convert the FP value to an int value through memory.
Chris Lattner	a216bee	2007-10-15 20:14:52 +0000	[diff] [blame]	2521	SDOperand FIPtr = DAG.CreateStackTemporary(MVT::f64);
				2522
				2523	// Emit a store to the stack slot.
				2524	SDOperand Chain = DAG.getStore(DAG.getEntryNode(), Tmp, FIPtr, NULL, 0);
				2525
				2526	// Result is a load from the stack slot. If loading 4 bytes, make sure to
				2527	// add in a bias.
Dan Gohman	f17a25c	2007-07-18 16:29:46 +0000	[diff] [blame]	2528	if (Op.getValueType() == MVT::i32)
Chris Lattner	a216bee	2007-10-15 20:14:52 +0000	[diff] [blame]	2529	FIPtr = DAG.getNode(ISD::ADD, FIPtr.getValueType(), FIPtr,
				2530	DAG.getConstant(4, FIPtr.getValueType()));
				2531	return DAG.getLoad(Op.getValueType(), Chain, FIPtr, NULL, 0);
Dan Gohman	f17a25c	2007-07-18 16:29:46 +0000	[diff] [blame]	2532	}
				2533
Dale Johannesen	8be83a7	2008-03-04 23:17:14 +0000	[diff] [blame]	2534	SDOperand PPCTargetLowering::LowerFP_ROUND_INREG(SDOperand Op,
				2535	SelectionDAG &DAG) {
Dale Johannesen	3d8578b	2007-10-10 01:01:31 +0000	[diff] [blame]	2536	assert(Op.getValueType() == MVT::ppcf128);
				2537	SDNode *Node = Op.Val;
				2538	assert(Node->getOperand(0).getValueType() == MVT::ppcf128);
Chris Lattner	c882caf	2007-10-19 04:08:28 +0000	[diff] [blame]	2539	assert(Node->getOperand(0).Val->getOpcode() == ISD::BUILD_PAIR);
Dale Johannesen	3d8578b	2007-10-10 01:01:31 +0000	[diff] [blame]	2540	SDOperand Lo = Node->getOperand(0).Val->getOperand(0);
				2541	SDOperand Hi = Node->getOperand(0).Val->getOperand(1);
				2542
				2543	// This sequence changes FPSCR to do round-to-zero, adds the two halves
				2544	// of the long double, and puts FPSCR back the way it was. We do not
				2545	// actually model FPSCR.
				2546	std::vector<MVT::ValueType> NodeTys;
				2547	SDOperand Ops[4], Result, MFFSreg, InFlag, FPreg;
				2548
				2549	NodeTys.push_back(MVT::f64); // Return register
				2550	NodeTys.push_back(MVT::Flag); // Returns a flag for later insns
				2551	Result = DAG.getNode(PPCISD::MFFS, NodeTys, &InFlag, 0);
				2552	MFFSreg = Result.getValue(0);
				2553	InFlag = Result.getValue(1);
				2554
				2555	NodeTys.clear();
				2556	NodeTys.push_back(MVT::Flag); // Returns a flag
				2557	Ops[0] = DAG.getConstant(31, MVT::i32);
				2558	Ops[1] = InFlag;
				2559	Result = DAG.getNode(PPCISD::MTFSB1, NodeTys, Ops, 2);
				2560	InFlag = Result.getValue(0);
				2561
				2562	NodeTys.clear();
				2563	NodeTys.push_back(MVT::Flag); // Returns a flag
				2564	Ops[0] = DAG.getConstant(30, MVT::i32);
				2565	Ops[1] = InFlag;
				2566	Result = DAG.getNode(PPCISD::MTFSB0, NodeTys, Ops, 2);
				2567	InFlag = Result.getValue(0);
				2568
				2569	NodeTys.clear();
				2570	NodeTys.push_back(MVT::f64); // result of add
				2571	NodeTys.push_back(MVT::Flag); // Returns a flag
				2572	Ops[0] = Lo;
				2573	Ops[1] = Hi;
				2574	Ops[2] = InFlag;
				2575	Result = DAG.getNode(PPCISD::FADDRTZ, NodeTys, Ops, 3);
				2576	FPreg = Result.getValue(0);
				2577	InFlag = Result.getValue(1);
				2578
				2579	NodeTys.clear();
				2580	NodeTys.push_back(MVT::f64);
				2581	Ops[0] = DAG.getConstant(1, MVT::i32);
				2582	Ops[1] = MFFSreg;
				2583	Ops[2] = FPreg;
				2584	Ops[3] = InFlag;
				2585	Result = DAG.getNode(PPCISD::MTFSF, NodeTys, Ops, 4);
				2586	FPreg = Result.getValue(0);
				2587
				2588	// We know the low half is about to be thrown away, so just use something
				2589	// convenient.
				2590	return DAG.getNode(ISD::BUILD_PAIR, Lo.getValueType(), FPreg, FPreg);
				2591	}
				2592
Dale Johannesen	8be83a7	2008-03-04 23:17:14 +0000	[diff] [blame]	2593	SDOperand PPCTargetLowering::LowerSINT_TO_FP(SDOperand Op, SelectionDAG &DAG) {
Dan Gohman	8b232ff	2008-03-11 01:59:03 +0000	[diff] [blame]	2594	// Don't handle ppc_fp128 here; let it be lowered to a libcall.
				2595	if (Op.getValueType() != MVT::f32 && Op.getValueType() != MVT::f64)
				2596	return SDOperand();
				2597
Dan Gohman	f17a25c	2007-07-18 16:29:46 +0000	[diff] [blame]	2598	if (Op.getOperand(0).getValueType() == MVT::i64) {
				2599	SDOperand Bits = DAG.getNode(ISD::BIT_CONVERT, MVT::f64, Op.getOperand(0));
				2600	SDOperand FP = DAG.getNode(PPCISD::FCFID, MVT::f64, Bits);
				2601	if (Op.getValueType() == MVT::f32)
Chris Lattner	5872a36	2008-01-17 07:00:52 +0000	[diff] [blame]	2602	FP = DAG.getNode(ISD::FP_ROUND, MVT::f32, FP, DAG.getIntPtrConstant(0));
Dan Gohman	f17a25c	2007-07-18 16:29:46 +0000	[diff] [blame]	2603	return FP;
				2604	}
				2605
				2606	assert(Op.getOperand(0).getValueType() == MVT::i32 &&
				2607	"Unhandled SINT_TO_FP type in custom expander!");
				2608	// Since we only generate this in 64-bit mode, we can take advantage of
				2609	// 64-bit registers. In particular, sign extend the input value into the
				2610	// 64-bit register with extsw, store the WHOLE 64-bit value into the stack
				2611	// then lfd it and fcfid it.
				2612	MachineFrameInfo *FrameInfo = DAG.getMachineFunction().getFrameInfo();
				2613	int FrameIdx = FrameInfo->CreateStackObject(8, 8);
				2614	MVT::ValueType PtrVT = DAG.getTargetLoweringInfo().getPointerTy();
				2615	SDOperand FIdx = DAG.getFrameIndex(FrameIdx, PtrVT);
				2616
				2617	SDOperand Ext64 = DAG.getNode(PPCISD::EXTSW_32, MVT::i32,
				2618	Op.getOperand(0));
				2619
				2620	// STD the extended value into the stack slot.
Dan Gohman	fb020b6	2008-02-07 18:41:25 +0000	[diff] [blame]	2621	MemOperand MO(PseudoSourceValue::getFixedStack(),
Dan Gohman	12a9c08	2008-02-06 22:27:42 +0000	[diff] [blame]	2622	MemOperand::MOStore, FrameIdx, 8, 8);
Dan Gohman	f17a25c	2007-07-18 16:29:46 +0000	[diff] [blame]	2623	SDOperand Store = DAG.getNode(PPCISD::STD_32, MVT::Other,
				2624	DAG.getEntryNode(), Ext64, FIdx,
Dan Gohman	12a9c08	2008-02-06 22:27:42 +0000	[diff] [blame]	2625	DAG.getMemOperand(MO));
Dan Gohman	f17a25c	2007-07-18 16:29:46 +0000	[diff] [blame]	2626	// Load the value as a double.
				2627	SDOperand Ld = DAG.getLoad(MVT::f64, Store, FIdx, NULL, 0);
				2628
				2629	// FCFID it and return it.
				2630	SDOperand FP = DAG.getNode(PPCISD::FCFID, MVT::f64, Ld);
				2631	if (Op.getValueType() == MVT::f32)
Chris Lattner	5872a36	2008-01-17 07:00:52 +0000	[diff] [blame]	2632	FP = DAG.getNode(ISD::FP_ROUND, MVT::f32, FP, DAG.getIntPtrConstant(0));
Dan Gohman	f17a25c	2007-07-18 16:29:46 +0000	[diff] [blame]	2633	return FP;
				2634	}
				2635
Dale Johannesen	8be83a7	2008-03-04 23:17:14 +0000	[diff] [blame]	2636	SDOperand PPCTargetLowering::LowerFLT_ROUNDS_(SDOperand Op, SelectionDAG &DAG) {
Dale Johannesen	436e380	2008-01-18 19:55:37 +0000	[diff] [blame]	2637	/*
				2638	The rounding mode is in bits 30:31 of FPSR, and has the following
				2639	settings:
				2640	00 Round to nearest
				2641	01 Round to 0
				2642	10 Round to +inf
				2643	11 Round to -inf
				2644
				2645	FLT_ROUNDS, on the other hand, expects the following:
				2646	-1 Undefined
				2647	0 Round to 0
				2648	1 Round to nearest
				2649	2 Round to +inf
				2650	3 Round to -inf
				2651
				2652	To perform the conversion, we do:
				2653	((FPSCR & 0x3) ^ ((~FPSCR & 0x3) >> 1))
				2654	*/
				2655
				2656	MachineFunction &MF = DAG.getMachineFunction();
				2657	MVT::ValueType VT = Op.getValueType();
				2658	MVT::ValueType PtrVT = DAG.getTargetLoweringInfo().getPointerTy();
				2659	std::vector<MVT::ValueType> NodeTys;
				2660	SDOperand MFFSreg, InFlag;
				2661
				2662	// Save FP Control Word to register
				2663	NodeTys.push_back(MVT::f64); // return register
				2664	NodeTys.push_back(MVT::Flag); // unused in this context
				2665	SDOperand Chain = DAG.getNode(PPCISD::MFFS, NodeTys, &InFlag, 0);
				2666
				2667	// Save FP register to stack slot
				2668	int SSFI = MF.getFrameInfo()->CreateStackObject(8, 8);
				2669	SDOperand StackSlot = DAG.getFrameIndex(SSFI, PtrVT);
				2670	SDOperand Store = DAG.getStore(DAG.getEntryNode(), Chain,
				2671	StackSlot, NULL, 0);
				2672
				2673	// Load FP Control Word from low 32 bits of stack slot.
				2674	SDOperand Four = DAG.getConstant(4, PtrVT);
				2675	SDOperand Addr = DAG.getNode(ISD::ADD, PtrVT, StackSlot, Four);
				2676	SDOperand CWD = DAG.getLoad(MVT::i32, Store, Addr, NULL, 0);
				2677
				2678	// Transform as necessary
				2679	SDOperand CWD1 =
				2680	DAG.getNode(ISD::AND, MVT::i32,
				2681	CWD, DAG.getConstant(3, MVT::i32));
				2682	SDOperand CWD2 =
				2683	DAG.getNode(ISD::SRL, MVT::i32,
				2684	DAG.getNode(ISD::AND, MVT::i32,
				2685	DAG.getNode(ISD::XOR, MVT::i32,
				2686	CWD, DAG.getConstant(3, MVT::i32)),
				2687	DAG.getConstant(3, MVT::i32)),
				2688	DAG.getConstant(1, MVT::i8));
				2689
				2690	SDOperand RetVal =
				2691	DAG.getNode(ISD::XOR, MVT::i32, CWD1, CWD2);
				2692
				2693	return DAG.getNode((MVT::getSizeInBits(VT) < 16 ?
				2694	ISD::TRUNCATE : ISD::ZERO_EXTEND), VT, RetVal);
				2695	}
				2696
Dale Johannesen	8be83a7	2008-03-04 23:17:14 +0000	[diff] [blame]	2697	SDOperand PPCTargetLowering::LowerSHL_PARTS(SDOperand Op, SelectionDAG &DAG) {
Dan Gohman	71619ec	2008-03-07 20:36:53 +0000	[diff] [blame]	2698	MVT::ValueType VT = Op.getValueType();
				2699	unsigned BitWidth = MVT::getSizeInBits(VT);
				2700	assert(Op.getNumOperands() == 3 &&
				2701	VT == Op.getOperand(1).getValueType() &&
				2702	"Unexpected SHL!");
Dan Gohman	f17a25c	2007-07-18 16:29:46 +0000	[diff] [blame]	2703
				2704	// Expand into a bunch of logical ops. Note that these ops
				2705	// depend on the PPC behavior for oversized shift amounts.
				2706	SDOperand Lo = Op.getOperand(0);
				2707	SDOperand Hi = Op.getOperand(1);
				2708	SDOperand Amt = Op.getOperand(2);
Dan Gohman	71619ec	2008-03-07 20:36:53 +0000	[diff] [blame]	2709	MVT::ValueType AmtVT = Amt.getValueType();
Dan Gohman	f17a25c	2007-07-18 16:29:46 +0000	[diff] [blame]	2710
Dan Gohman	71619ec	2008-03-07 20:36:53 +0000	[diff] [blame]	2711	SDOperand Tmp1 = DAG.getNode(ISD::SUB, AmtVT,
				2712	DAG.getConstant(BitWidth, AmtVT), Amt);
				2713	SDOperand Tmp2 = DAG.getNode(PPCISD::SHL, VT, Hi, Amt);
				2714	SDOperand Tmp3 = DAG.getNode(PPCISD::SRL, VT, Lo, Tmp1);
				2715	SDOperand Tmp4 = DAG.getNode(ISD::OR , VT, Tmp2, Tmp3);
				2716	SDOperand Tmp5 = DAG.getNode(ISD::ADD, AmtVT, Amt,
				2717	DAG.getConstant(-BitWidth, AmtVT));
				2718	SDOperand Tmp6 = DAG.getNode(PPCISD::SHL, VT, Lo, Tmp5);
				2719	SDOperand OutHi = DAG.getNode(ISD::OR, VT, Tmp4, Tmp6);
				2720	SDOperand OutLo = DAG.getNode(PPCISD::SHL, VT, Lo, Amt);
Dan Gohman	f17a25c	2007-07-18 16:29:46 +0000	[diff] [blame]	2721	SDOperand OutOps[] = { OutLo, OutHi };
Dan Gohman	71619ec	2008-03-07 20:36:53 +0000	[diff] [blame]	2722	return DAG.getNode(ISD::MERGE_VALUES, DAG.getVTList(VT, VT),
Dan Gohman	f17a25c	2007-07-18 16:29:46 +0000	[diff] [blame]	2723	OutOps, 2);
				2724	}
				2725
Dale Johannesen	8be83a7	2008-03-04 23:17:14 +0000	[diff] [blame]	2726	SDOperand PPCTargetLowering::LowerSRL_PARTS(SDOperand Op, SelectionDAG &DAG) {
Dan Gohman	71619ec	2008-03-07 20:36:53 +0000	[diff] [blame]	2727	MVT::ValueType VT = Op.getValueType();
				2728	unsigned BitWidth = MVT::getSizeInBits(VT);
				2729	assert(Op.getNumOperands() == 3 &&
				2730	VT == Op.getOperand(1).getValueType() &&
				2731	"Unexpected SRL!");
Dan Gohman	f17a25c	2007-07-18 16:29:46 +0000	[diff] [blame]	2732
Dan Gohman	71619ec	2008-03-07 20:36:53 +0000	[diff] [blame]	2733	// Expand into a bunch of logical ops. Note that these ops
Dan Gohman	f17a25c	2007-07-18 16:29:46 +0000	[diff] [blame]	2734	// depend on the PPC behavior for oversized shift amounts.
				2735	SDOperand Lo = Op.getOperand(0);
				2736	SDOperand Hi = Op.getOperand(1);
				2737	SDOperand Amt = Op.getOperand(2);
Dan Gohman	71619ec	2008-03-07 20:36:53 +0000	[diff] [blame]	2738	MVT::ValueType AmtVT = Amt.getValueType();
Dan Gohman	f17a25c	2007-07-18 16:29:46 +0000	[diff] [blame]	2739
Dan Gohman	71619ec	2008-03-07 20:36:53 +0000	[diff] [blame]	2740	SDOperand Tmp1 = DAG.getNode(ISD::SUB, AmtVT,
				2741	DAG.getConstant(BitWidth, AmtVT), Amt);
				2742	SDOperand Tmp2 = DAG.getNode(PPCISD::SRL, VT, Lo, Amt);
				2743	SDOperand Tmp3 = DAG.getNode(PPCISD::SHL, VT, Hi, Tmp1);
				2744	SDOperand Tmp4 = DAG.getNode(ISD::OR , VT, Tmp2, Tmp3);
				2745	SDOperand Tmp5 = DAG.getNode(ISD::ADD, AmtVT, Amt,
				2746	DAG.getConstant(-BitWidth, AmtVT));
				2747	SDOperand Tmp6 = DAG.getNode(PPCISD::SRL, VT, Hi, Tmp5);
				2748	SDOperand OutLo = DAG.getNode(ISD::OR, VT, Tmp4, Tmp6);
				2749	SDOperand OutHi = DAG.getNode(PPCISD::SRL, VT, Hi, Amt);
Dan Gohman	f17a25c	2007-07-18 16:29:46 +0000	[diff] [blame]	2750	SDOperand OutOps[] = { OutLo, OutHi };
Dan Gohman	71619ec	2008-03-07 20:36:53 +0000	[diff] [blame]	2751	return DAG.getNode(ISD::MERGE_VALUES, DAG.getVTList(VT, VT),
Dan Gohman	f17a25c	2007-07-18 16:29:46 +0000	[diff] [blame]	2752	OutOps, 2);
				2753	}
				2754
Dale Johannesen	8be83a7	2008-03-04 23:17:14 +0000	[diff] [blame]	2755	SDOperand PPCTargetLowering::LowerSRA_PARTS(SDOperand Op, SelectionDAG &DAG) {
Dan Gohman	71619ec	2008-03-07 20:36:53 +0000	[diff] [blame]	2756	MVT::ValueType VT = Op.getValueType();
				2757	unsigned BitWidth = MVT::getSizeInBits(VT);
				2758	assert(Op.getNumOperands() == 3 &&
				2759	VT == Op.getOperand(1).getValueType() &&
				2760	"Unexpected SRA!");
Dan Gohman	f17a25c	2007-07-18 16:29:46 +0000	[diff] [blame]	2761
Dan Gohman	71619ec	2008-03-07 20:36:53 +0000	[diff] [blame]	2762	// Expand into a bunch of logical ops, followed by a select_cc.
Dan Gohman	f17a25c	2007-07-18 16:29:46 +0000	[diff] [blame]	2763	SDOperand Lo = Op.getOperand(0);
				2764	SDOperand Hi = Op.getOperand(1);
				2765	SDOperand Amt = Op.getOperand(2);
Dan Gohman	71619ec	2008-03-07 20:36:53 +0000	[diff] [blame]	2766	MVT::ValueType AmtVT = Amt.getValueType();
Dan Gohman	f17a25c	2007-07-18 16:29:46 +0000	[diff] [blame]	2767
Dan Gohman	71619ec	2008-03-07 20:36:53 +0000	[diff] [blame]	2768	SDOperand Tmp1 = DAG.getNode(ISD::SUB, AmtVT,
				2769	DAG.getConstant(BitWidth, AmtVT), Amt);
				2770	SDOperand Tmp2 = DAG.getNode(PPCISD::SRL, VT, Lo, Amt);
				2771	SDOperand Tmp3 = DAG.getNode(PPCISD::SHL, VT, Hi, Tmp1);
				2772	SDOperand Tmp4 = DAG.getNode(ISD::OR , VT, Tmp2, Tmp3);
				2773	SDOperand Tmp5 = DAG.getNode(ISD::ADD, AmtVT, Amt,
				2774	DAG.getConstant(-BitWidth, AmtVT));
				2775	SDOperand Tmp6 = DAG.getNode(PPCISD::SRA, VT, Hi, Tmp5);
				2776	SDOperand OutHi = DAG.getNode(PPCISD::SRA, VT, Hi, Amt);
				2777	SDOperand OutLo = DAG.getSelectCC(Tmp5, DAG.getConstant(0, AmtVT),
Dan Gohman	f17a25c	2007-07-18 16:29:46 +0000	[diff] [blame]	2778	Tmp4, Tmp6, ISD::SETLE);
				2779	SDOperand OutOps[] = { OutLo, OutHi };
Dan Gohman	71619ec	2008-03-07 20:36:53 +0000	[diff] [blame]	2780	return DAG.getNode(ISD::MERGE_VALUES, DAG.getVTList(VT, VT),
Dan Gohman	f17a25c	2007-07-18 16:29:46 +0000	[diff] [blame]	2781	OutOps, 2);
				2782	}
				2783
				2784	//===----------------------------------------------------------------------===//
				2785	// Vector related lowering.
				2786	//
				2787
				2788	// If this is a vector of constants or undefs, get the bits. A bit in
				2789	// UndefBits is set if the corresponding element of the vector is an
				2790	// ISD::UNDEF value. For undefs, the corresponding VectorBits values are
				2791	// zero. Return true if this is not an array of constants, false if it is.
				2792	//
				2793	static bool GetConstantBuildVectorBits(SDNode *BV, uint64_t VectorBits[2],
				2794	uint64_t UndefBits[2]) {
				2795	// Start with zero'd results.
				2796	VectorBits[0] = VectorBits[1] = UndefBits[0] = UndefBits[1] = 0;
				2797
				2798	unsigned EltBitSize = MVT::getSizeInBits(BV->getOperand(0).getValueType());
				2799	for (unsigned i = 0, e = BV->getNumOperands(); i != e; ++i) {
				2800	SDOperand OpVal = BV->getOperand(i);
				2801
				2802	unsigned PartNo = i >= e/2; // In the upper 128 bits?
				2803	unsigned SlotNo = e/2 - (i & (e/2-1))-1; // Which subpiece of the uint64_t.
				2804
				2805	uint64_t EltBits = 0;
				2806	if (OpVal.getOpcode() == ISD::UNDEF) {
				2807	uint64_t EltUndefBits = ~0U >> (32-EltBitSize);
				2808	UndefBits[PartNo] \|= EltUndefBits << (SlotNo*EltBitSize);
				2809	continue;
				2810	} else if (ConstantSDNode *CN = dyn_cast<ConstantSDNode>(OpVal)) {
				2811	EltBits = CN->getValue() & (~0U >> (32-EltBitSize));
				2812	} else if (ConstantFPSDNode *CN = dyn_cast<ConstantFPSDNode>(OpVal)) {
				2813	assert(CN->getValueType(0) == MVT::f32 &&
				2814	"Only one legal FP vector type!");
Dale Johannesen	df8a831	2007-08-31 04:03:46 +0000	[diff] [blame]	2815	EltBits = FloatToBits(CN->getValueAPF().convertToFloat());
Dan Gohman	f17a25c	2007-07-18 16:29:46 +0000	[diff] [blame]	2816	} else {
				2817	// Nonconstant element.
				2818	return true;
				2819	}
				2820
				2821	VectorBits[PartNo] \|= EltBits << (SlotNo*EltBitSize);
				2822	}
				2823
				2824	//printf("%llx %llx %llx %llx\n",
				2825	// VectorBits[0], VectorBits[1], UndefBits[0], UndefBits[1]);
				2826	return false;
				2827	}
				2828
				2829	// If this is a splat (repetition) of a value across the whole vector, return
				2830	// the smallest size that splats it. For example, "0x01010101010101..." is a
				2831	// splat of 0x01, 0x0101, and 0x01010101. We return SplatBits = 0x01 and
				2832	// SplatSize = 1 byte.
				2833	static bool isConstantSplat(const uint64_t Bits128[2],
				2834	const uint64_t Undef128[2],
				2835	unsigned &SplatBits, unsigned &SplatUndef,
				2836	unsigned &SplatSize) {
				2837
				2838	// Don't let undefs prevent splats from matching. See if the top 64-bits are
				2839	// the same as the lower 64-bits, ignoring undefs.
				2840	if ((Bits128[0] & ~Undef128[1]) != (Bits128[1] & ~Undef128[0]))
				2841	return false; // Can't be a splat if two pieces don't match.
				2842
				2843	uint64_t Bits64 = Bits128[0] \| Bits128[1];
				2844	uint64_t Undef64 = Undef128[0] & Undef128[1];
				2845
				2846	// Check that the top 32-bits are the same as the lower 32-bits, ignoring
				2847	// undefs.
				2848	if ((Bits64 & (~Undef64 >> 32)) != ((Bits64 >> 32) & ~Undef64))
				2849	return false; // Can't be a splat if two pieces don't match.
				2850
				2851	uint32_t Bits32 = uint32_t(Bits64) \| uint32_t(Bits64 >> 32);
				2852	uint32_t Undef32 = uint32_t(Undef64) & uint32_t(Undef64 >> 32);
				2853
				2854	// If the top 16-bits are different than the lower 16-bits, ignoring
				2855	// undefs, we have an i32 splat.
				2856	if ((Bits32 & (~Undef32 >> 16)) != ((Bits32 >> 16) & ~Undef32)) {
				2857	SplatBits = Bits32;
				2858	SplatUndef = Undef32;
				2859	SplatSize = 4;
				2860	return true;
				2861	}
				2862
				2863	uint16_t Bits16 = uint16_t(Bits32) \| uint16_t(Bits32 >> 16);
				2864	uint16_t Undef16 = uint16_t(Undef32) & uint16_t(Undef32 >> 16);
				2865
				2866	// If the top 8-bits are different than the lower 8-bits, ignoring
				2867	// undefs, we have an i16 splat.
				2868	if ((Bits16 & (uint16_t(~Undef16) >> 8)) != ((Bits16 >> 8) & ~Undef16)) {
				2869	SplatBits = Bits16;
				2870	SplatUndef = Undef16;
				2871	SplatSize = 2;
				2872	return true;
				2873	}
				2874
				2875	// Otherwise, we have an 8-bit splat.
				2876	SplatBits = uint8_t(Bits16) \| uint8_t(Bits16 >> 8);
				2877	SplatUndef = uint8_t(Undef16) & uint8_t(Undef16 >> 8);
				2878	SplatSize = 1;
				2879	return true;
				2880	}
				2881
				2882	/// BuildSplatI - Build a canonical splati of Val with an element size of
				2883	/// SplatSize. Cast the result to VT.
				2884	static SDOperand BuildSplatI(int Val, unsigned SplatSize, MVT::ValueType VT,
				2885	SelectionDAG &DAG) {
				2886	assert(Val >= -16 && Val <= 15 && "vsplti is out of range!");
				2887
				2888	static const MVT::ValueType VTys[] = { // canonical VT to use for each size.
				2889	MVT::v16i8, MVT::v8i16, MVT::Other, MVT::v4i32
				2890	};
				2891
				2892	MVT::ValueType ReqVT = VT != MVT::Other ? VT : VTys[SplatSize-1];
				2893
				2894	// Force vspltis[hw] -1 to vspltisb -1 to canonicalize.
				2895	if (Val == -1)
				2896	SplatSize = 1;
				2897
				2898	MVT::ValueType CanonicalVT = VTys[SplatSize-1];
				2899
				2900	// Build a canonical splat for this value.
				2901	SDOperand Elt = DAG.getConstant(Val, MVT::getVectorElementType(CanonicalVT));
				2902	SmallVector<SDOperand, 8> Ops;
				2903	Ops.assign(MVT::getVectorNumElements(CanonicalVT), Elt);
				2904	SDOperand Res = DAG.getNode(ISD::BUILD_VECTOR, CanonicalVT,
				2905	&Ops[0], Ops.size());
				2906	return DAG.getNode(ISD::BIT_CONVERT, ReqVT, Res);
				2907	}
				2908
				2909	/// BuildIntrinsicOp - Return a binary operator intrinsic node with the
				2910	/// specified intrinsic ID.
				2911	static SDOperand BuildIntrinsicOp(unsigned IID, SDOperand LHS, SDOperand RHS,
				2912	SelectionDAG &DAG,
				2913	MVT::ValueType DestVT = MVT::Other) {
				2914	if (DestVT == MVT::Other) DestVT = LHS.getValueType();
				2915	return DAG.getNode(ISD::INTRINSIC_WO_CHAIN, DestVT,
				2916	DAG.getConstant(IID, MVT::i32), LHS, RHS);
				2917	}
				2918
				2919	/// BuildIntrinsicOp - Return a ternary operator intrinsic node with the
				2920	/// specified intrinsic ID.
				2921	static SDOperand BuildIntrinsicOp(unsigned IID, SDOperand Op0, SDOperand Op1,
				2922	SDOperand Op2, SelectionDAG &DAG,
				2923	MVT::ValueType DestVT = MVT::Other) {
				2924	if (DestVT == MVT::Other) DestVT = Op0.getValueType();
				2925	return DAG.getNode(ISD::INTRINSIC_WO_CHAIN, DestVT,
				2926	DAG.getConstant(IID, MVT::i32), Op0, Op1, Op2);
				2927	}
				2928
				2929
				2930	/// BuildVSLDOI - Return a VECTOR_SHUFFLE that is a vsldoi of the specified
				2931	/// amount. The result has the specified value type.
				2932	static SDOperand BuildVSLDOI(SDOperand LHS, SDOperand RHS, unsigned Amt,
				2933	MVT::ValueType VT, SelectionDAG &DAG) {
				2934	// Force LHS/RHS to be the right type.
				2935	LHS = DAG.getNode(ISD::BIT_CONVERT, MVT::v16i8, LHS);
				2936	RHS = DAG.getNode(ISD::BIT_CONVERT, MVT::v16i8, RHS);
				2937
				2938	SDOperand Ops[16];
				2939	for (unsigned i = 0; i != 16; ++i)
				2940	Ops[i] = DAG.getConstant(i+Amt, MVT::i32);
				2941	SDOperand T = DAG.getNode(ISD::VECTOR_SHUFFLE, MVT::v16i8, LHS, RHS,
				2942	DAG.getNode(ISD::BUILD_VECTOR, MVT::v16i8, Ops,16));
				2943	return DAG.getNode(ISD::BIT_CONVERT, VT, T);
				2944	}
				2945
				2946	// If this is a case we can't handle, return null and let the default
				2947	// expansion code take care of it. If we CAN select this case, and if it
				2948	// selects to a single instruction, return Op. Otherwise, if we can codegen
				2949	// this case more efficiently than a constant pool load, lower it to the
				2950	// sequence of ops that should be used.
Dale Johannesen	8be83a7	2008-03-04 23:17:14 +0000	[diff] [blame]	2951	SDOperand PPCTargetLowering::LowerBUILD_VECTOR(SDOperand Op,
				2952	SelectionDAG &DAG) {
Dan Gohman	f17a25c	2007-07-18 16:29:46 +0000	[diff] [blame]	2953	// If this is a vector of constants or undefs, get the bits. A bit in
				2954	// UndefBits is set if the corresponding element of the vector is an
				2955	// ISD::UNDEF value. For undefs, the corresponding VectorBits values are
				2956	// zero.
				2957	uint64_t VectorBits[2];
				2958	uint64_t UndefBits[2];
				2959	if (GetConstantBuildVectorBits(Op.Val, VectorBits, UndefBits))
				2960	return SDOperand(); // Not a constant vector.
				2961
				2962	// If this is a splat (repetition) of a value across the whole vector, return
				2963	// the smallest size that splats it. For example, "0x01010101010101..." is a
				2964	// splat of 0x01, 0x0101, and 0x01010101. We return SplatBits = 0x01 and
				2965	// SplatSize = 1 byte.
				2966	unsigned SplatBits, SplatUndef, SplatSize;
				2967	if (isConstantSplat(VectorBits, UndefBits, SplatBits, SplatUndef, SplatSize)){
				2968	bool HasAnyUndefs = (UndefBits[0] \| UndefBits[1]) != 0;
				2969
				2970	// First, handle single instruction cases.
				2971
				2972	// All zeros?
				2973	if (SplatBits == 0) {
				2974	// Canonicalize all zero vectors to be v4i32.
				2975	if (Op.getValueType() != MVT::v4i32 \|\| HasAnyUndefs) {
				2976	SDOperand Z = DAG.getConstant(0, MVT::i32);
				2977	Z = DAG.getNode(ISD::BUILD_VECTOR, MVT::v4i32, Z, Z, Z, Z);
				2978	Op = DAG.getNode(ISD::BIT_CONVERT, Op.getValueType(), Z);
				2979	}
				2980	return Op;
				2981	}
				2982
				2983	// If the sign extended value is in the range [-16,15], use VSPLTI[bhw].
				2984	int32_t SextVal= int32_t(SplatBits << (32-8SplatSize)) >> (32-8SplatSize);
				2985	if (SextVal >= -16 && SextVal <= 15)
				2986	return BuildSplatI(SextVal, SplatSize, Op.getValueType(), DAG);
				2987
				2988
				2989	// Two instruction sequences.
				2990
				2991	// If this value is in the range [-32,30] and is even, use:
				2992	// tmp = VSPLTI[bhw], result = add tmp, tmp
				2993	if (SextVal >= -32 && SextVal <= 30 && (SextVal & 1) == 0) {
				2994	Op = BuildSplatI(SextVal >> 1, SplatSize, Op.getValueType(), DAG);
				2995	return DAG.getNode(ISD::ADD, Op.getValueType(), Op, Op);
				2996	}
				2997
				2998	// If this is 0x8000_0000 x 4, turn into vspltisw + vslw. If it is
				2999	// 0x7FFF_FFFF x 4, turn it into not(0x8000_0000). This is important
				3000	// for fneg/fabs.
				3001	if (SplatSize == 4 && SplatBits == (0x7FFFFFFF&~SplatUndef)) {
				3002	// Make -1 and vspltisw -1:
				3003	SDOperand OnesV = BuildSplatI(-1, 4, MVT::v4i32, DAG);
				3004
				3005	// Make the VSLW intrinsic, computing 0x8000_0000.
				3006	SDOperand Res = BuildIntrinsicOp(Intrinsic::ppc_altivec_vslw, OnesV,
				3007	OnesV, DAG);
				3008
				3009	// xor by OnesV to invert it.
				3010	Res = DAG.getNode(ISD::XOR, MVT::v4i32, Res, OnesV);
				3011	return DAG.getNode(ISD::BIT_CONVERT, Op.getValueType(), Res);
				3012	}
				3013
				3014	// Check to see if this is a wide variety of vsplti*, binop self cases.
				3015	unsigned SplatBitSize = SplatSize*8;
				3016	static const signed char SplatCsts[] = {
				3017	-1, 1, -2, 2, -3, 3, -4, 4, -5, 5, -6, 6, -7, 7,
				3018	-8, 8, -9, 9, -10, 10, -11, 11, -12, 12, -13, 13, 14, -14, 15, -15, -16
				3019	};
				3020
Owen Anderson	1636de9	2007-09-07 04:06:50 +0000	[diff] [blame]	3021	for (unsigned idx = 0; idx < array_lengthof(SplatCsts); ++idx) {
Dan Gohman	f17a25c	2007-07-18 16:29:46 +0000	[diff] [blame]	3022	// Indirect through the SplatCsts array so that we favor 'vsplti -1' for
				3023	// cases which are ambiguous (e.g. formation of 0x8000_0000). 'vsplti -1'
				3024	int i = SplatCsts[idx];
				3025
				3026	// Figure out what shift amount will be used by altivec if shifted by i in
				3027	// this splat size.
				3028	unsigned TypeShiftAmt = i & (SplatBitSize-1);
				3029
				3030	// vsplti + shl self.
				3031	if (SextVal == (i << (int)TypeShiftAmt)) {
				3032	SDOperand Res = BuildSplatI(i, SplatSize, MVT::Other, DAG);
				3033	static const unsigned IIDs[] = { // Intrinsic to use for each size.
				3034	Intrinsic::ppc_altivec_vslb, Intrinsic::ppc_altivec_vslh, 0,
				3035	Intrinsic::ppc_altivec_vslw
				3036	};
				3037	Res = BuildIntrinsicOp(IIDs[SplatSize-1], Res, Res, DAG);
				3038	return DAG.getNode(ISD::BIT_CONVERT, Op.getValueType(), Res);
				3039	}
				3040
				3041	// vsplti + srl self.
				3042	if (SextVal == (int)((unsigned)i >> TypeShiftAmt)) {
				3043	SDOperand Res = BuildSplatI(i, SplatSize, MVT::Other, DAG);
				3044	static const unsigned IIDs[] = { // Intrinsic to use for each size.
				3045	Intrinsic::ppc_altivec_vsrb, Intrinsic::ppc_altivec_vsrh, 0,
				3046	Intrinsic::ppc_altivec_vsrw
				3047	};
				3048	Res = BuildIntrinsicOp(IIDs[SplatSize-1], Res, Res, DAG);
				3049	return DAG.getNode(ISD::BIT_CONVERT, Op.getValueType(), Res);
				3050	}
				3051
				3052	// vsplti + sra self.
				3053	if (SextVal == (int)((unsigned)i >> TypeShiftAmt)) {
				3054	SDOperand Res = BuildSplatI(i, SplatSize, MVT::Other, DAG);
				3055	static const unsigned IIDs[] = { // Intrinsic to use for each size.
				3056	Intrinsic::ppc_altivec_vsrab, Intrinsic::ppc_altivec_vsrah, 0,
				3057	Intrinsic::ppc_altivec_vsraw
				3058	};
				3059	Res = BuildIntrinsicOp(IIDs[SplatSize-1], Res, Res, DAG);
				3060	return DAG.getNode(ISD::BIT_CONVERT, Op.getValueType(), Res);
				3061	}
				3062
				3063	// vsplti + rol self.
				3064	if (SextVal == (int)(((unsigned)i << TypeShiftAmt) \|
				3065	((unsigned)i >> (SplatBitSize-TypeShiftAmt)))) {
				3066	SDOperand Res = BuildSplatI(i, SplatSize, MVT::Other, DAG);
				3067	static const unsigned IIDs[] = { // Intrinsic to use for each size.
				3068	Intrinsic::ppc_altivec_vrlb, Intrinsic::ppc_altivec_vrlh, 0,
				3069	Intrinsic::ppc_altivec_vrlw
				3070	};
				3071	Res = BuildIntrinsicOp(IIDs[SplatSize-1], Res, Res, DAG);
				3072	return DAG.getNode(ISD::BIT_CONVERT, Op.getValueType(), Res);
				3073	}
				3074
				3075	// t = vsplti c, result = vsldoi t, t, 1
				3076	if (SextVal == ((i << 8) \| (i >> (TypeShiftAmt-8)))) {
				3077	SDOperand T = BuildSplatI(i, SplatSize, MVT::v16i8, DAG);
				3078	return BuildVSLDOI(T, T, 1, Op.getValueType(), DAG);
				3079	}
				3080	// t = vsplti c, result = vsldoi t, t, 2
				3081	if (SextVal == ((i << 16) \| (i >> (TypeShiftAmt-16)))) {
				3082	SDOperand T = BuildSplatI(i, SplatSize, MVT::v16i8, DAG);
				3083	return BuildVSLDOI(T, T, 2, Op.getValueType(), DAG);
				3084	}
				3085	// t = vsplti c, result = vsldoi t, t, 3
				3086	if (SextVal == ((i << 24) \| (i >> (TypeShiftAmt-24)))) {
				3087	SDOperand T = BuildSplatI(i, SplatSize, MVT::v16i8, DAG);
				3088	return BuildVSLDOI(T, T, 3, Op.getValueType(), DAG);
				3089	}
				3090	}
				3091
				3092	// Three instruction sequences.
				3093
				3094	// Odd, in range [17,31]: (vsplti C)-(vsplti -16).
				3095	if (SextVal >= 0 && SextVal <= 31) {
				3096	SDOperand LHS = BuildSplatI(SextVal-16, SplatSize, MVT::Other, DAG);
				3097	SDOperand RHS = BuildSplatI(-16, SplatSize, MVT::Other, DAG);
Dale Johannesen	6fdf931	2007-10-14 01:58:32 +0000	[diff] [blame]	3098	LHS = DAG.getNode(ISD::SUB, LHS.getValueType(), LHS, RHS);
Dan Gohman	f17a25c	2007-07-18 16:29:46 +0000	[diff] [blame]	3099	return DAG.getNode(ISD::BIT_CONVERT, Op.getValueType(), LHS);
				3100	}
				3101	// Odd, in range [-31,-17]: (vsplti C)+(vsplti -16).
				3102	if (SextVal >= -31 && SextVal <= 0) {
				3103	SDOperand LHS = BuildSplatI(SextVal+16, SplatSize, MVT::Other, DAG);
				3104	SDOperand RHS = BuildSplatI(-16, SplatSize, MVT::Other, DAG);
Dale Johannesen	6fdf931	2007-10-14 01:58:32 +0000	[diff] [blame]	3105	LHS = DAG.getNode(ISD::ADD, LHS.getValueType(), LHS, RHS);
Dan Gohman	f17a25c	2007-07-18 16:29:46 +0000	[diff] [blame]	3106	return DAG.getNode(ISD::BIT_CONVERT, Op.getValueType(), LHS);
				3107	}
				3108	}
				3109
				3110	return SDOperand();
				3111	}
				3112
				3113	/// GeneratePerfectShuffle - Given an entry in the perfect-shuffle table, emit
				3114	/// the specified operations to build the shuffle.
				3115	static SDOperand GeneratePerfectShuffle(unsigned PFEntry, SDOperand LHS,
				3116	SDOperand RHS, SelectionDAG &DAG) {
				3117	unsigned OpNum = (PFEntry >> 26) & 0x0F;
				3118	unsigned LHSID = (PFEntry >> 13) & ((1 << 13)-1);
				3119	unsigned RHSID = (PFEntry >> 0) & ((1 << 13)-1);
				3120
				3121	enum {
				3122	OP_COPY = 0, // Copy, used for things like <u,u,u,3> to say it is <0,1,2,3>
				3123	OP_VMRGHW,
				3124	OP_VMRGLW,
				3125	OP_VSPLTISW0,
				3126	OP_VSPLTISW1,
				3127	OP_VSPLTISW2,
				3128	OP_VSPLTISW3,
				3129	OP_VSLDOI4,
				3130	OP_VSLDOI8,
				3131	OP_VSLDOI12
				3132	};
				3133
				3134	if (OpNum == OP_COPY) {
				3135	if (LHSID == (19+2)9+3) return LHS;
				3136	assert(LHSID == ((49+5)9+6)*9+7 && "Illegal OP_COPY!");
				3137	return RHS;
				3138	}
				3139
				3140	SDOperand OpLHS, OpRHS;
				3141	OpLHS = GeneratePerfectShuffle(PerfectShuffleTable[LHSID], LHS, RHS, DAG);
				3142	OpRHS = GeneratePerfectShuffle(PerfectShuffleTable[RHSID], LHS, RHS, DAG);
				3143
				3144	unsigned ShufIdxs[16];
				3145	switch (OpNum) {
				3146	default: assert(0 && "Unknown i32 permute!");
				3147	case OP_VMRGHW:
				3148	ShufIdxs[ 0] = 0; ShufIdxs[ 1] = 1; ShufIdxs[ 2] = 2; ShufIdxs[ 3] = 3;
				3149	ShufIdxs[ 4] = 16; ShufIdxs[ 5] = 17; ShufIdxs[ 6] = 18; ShufIdxs[ 7] = 19;
				3150	ShufIdxs[ 8] = 4; ShufIdxs[ 9] = 5; ShufIdxs[10] = 6; ShufIdxs[11] = 7;
				3151	ShufIdxs[12] = 20; ShufIdxs[13] = 21; ShufIdxs[14] = 22; ShufIdxs[15] = 23;
				3152	break;
				3153	case OP_VMRGLW:
				3154	ShufIdxs[ 0] = 8; ShufIdxs[ 1] = 9; ShufIdxs[ 2] = 10; ShufIdxs[ 3] = 11;
				3155	ShufIdxs[ 4] = 24; ShufIdxs[ 5] = 25; ShufIdxs[ 6] = 26; ShufIdxs[ 7] = 27;
				3156	ShufIdxs[ 8] = 12; ShufIdxs[ 9] = 13; ShufIdxs[10] = 14; ShufIdxs[11] = 15;
				3157	ShufIdxs[12] = 28; ShufIdxs[13] = 29; ShufIdxs[14] = 30; ShufIdxs[15] = 31;
				3158	break;
				3159	case OP_VSPLTISW0:
				3160	for (unsigned i = 0; i != 16; ++i)
				3161	ShufIdxs[i] = (i&3)+0;
				3162	break;
				3163	case OP_VSPLTISW1:
				3164	for (unsigned i = 0; i != 16; ++i)
				3165	ShufIdxs[i] = (i&3)+4;
				3166	break;
				3167	case OP_VSPLTISW2:
				3168	for (unsigned i = 0; i != 16; ++i)
				3169	ShufIdxs[i] = (i&3)+8;
				3170	break;
				3171	case OP_VSPLTISW3:
				3172	for (unsigned i = 0; i != 16; ++i)
				3173	ShufIdxs[i] = (i&3)+12;
				3174	break;
				3175	case OP_VSLDOI4:
				3176	return BuildVSLDOI(OpLHS, OpRHS, 4, OpLHS.getValueType(), DAG);
				3177	case OP_VSLDOI8:
				3178	return BuildVSLDOI(OpLHS, OpRHS, 8, OpLHS.getValueType(), DAG);
				3179	case OP_VSLDOI12:
				3180	return BuildVSLDOI(OpLHS, OpRHS, 12, OpLHS.getValueType(), DAG);
				3181	}
				3182	SDOperand Ops[16];
				3183	for (unsigned i = 0; i != 16; ++i)
				3184	Ops[i] = DAG.getConstant(ShufIdxs[i], MVT::i32);
				3185
				3186	return DAG.getNode(ISD::VECTOR_SHUFFLE, OpLHS.getValueType(), OpLHS, OpRHS,
				3187	DAG.getNode(ISD::BUILD_VECTOR, MVT::v16i8, Ops, 16));
				3188	}
				3189
				3190	/// LowerVECTOR_SHUFFLE - Return the code we lower for VECTOR_SHUFFLE. If this
				3191	/// is a shuffle we can handle in a single instruction, return it. Otherwise,
				3192	/// return the code it can be lowered into. Worst case, it can always be
				3193	/// lowered into a vperm.
Dale Johannesen	8be83a7	2008-03-04 23:17:14 +0000	[diff] [blame]	3194	SDOperand PPCTargetLowering::LowerVECTOR_SHUFFLE(SDOperand Op,
				3195	SelectionDAG &DAG) {
Dan Gohman	f17a25c	2007-07-18 16:29:46 +0000	[diff] [blame]	3196	SDOperand V1 = Op.getOperand(0);
				3197	SDOperand V2 = Op.getOperand(1);
				3198	SDOperand PermMask = Op.getOperand(2);
				3199
				3200	// Cases that are handled by instructions that take permute immediates
				3201	// (such as vsplt*) should be left as VECTOR_SHUFFLE nodes so they can be
				3202	// selected by the instruction selector.
				3203	if (V2.getOpcode() == ISD::UNDEF) {
				3204	if (PPC::isSplatShuffleMask(PermMask.Val, 1) \|\|
				3205	PPC::isSplatShuffleMask(PermMask.Val, 2) \|\|
				3206	PPC::isSplatShuffleMask(PermMask.Val, 4) \|\|
				3207	PPC::isVPKUWUMShuffleMask(PermMask.Val, true) \|\|
				3208	PPC::isVPKUHUMShuffleMask(PermMask.Val, true) \|\|
				3209	PPC::isVSLDOIShuffleMask(PermMask.Val, true) != -1 \|\|
				3210	PPC::isVMRGLShuffleMask(PermMask.Val, 1, true) \|\|
				3211	PPC::isVMRGLShuffleMask(PermMask.Val, 2, true) \|\|
				3212	PPC::isVMRGLShuffleMask(PermMask.Val, 4, true) \|\|
				3213	PPC::isVMRGHShuffleMask(PermMask.Val, 1, true) \|\|
				3214	PPC::isVMRGHShuffleMask(PermMask.Val, 2, true) \|\|
				3215	PPC::isVMRGHShuffleMask(PermMask.Val, 4, true)) {
				3216	return Op;
				3217	}
				3218	}
				3219
				3220	// Altivec has a variety of "shuffle immediates" that take two vector inputs
				3221	// and produce a fixed permutation. If any of these match, do not lower to
				3222	// VPERM.
				3223	if (PPC::isVPKUWUMShuffleMask(PermMask.Val, false) \|\|
				3224	PPC::isVPKUHUMShuffleMask(PermMask.Val, false) \|\|
				3225	PPC::isVSLDOIShuffleMask(PermMask.Val, false) != -1 \|\|
				3226	PPC::isVMRGLShuffleMask(PermMask.Val, 1, false) \|\|
				3227	PPC::isVMRGLShuffleMask(PermMask.Val, 2, false) \|\|
				3228	PPC::isVMRGLShuffleMask(PermMask.Val, 4, false) \|\|
				3229	PPC::isVMRGHShuffleMask(PermMask.Val, 1, false) \|\|
				3230	PPC::isVMRGHShuffleMask(PermMask.Val, 2, false) \|\|
				3231	PPC::isVMRGHShuffleMask(PermMask.Val, 4, false))
				3232	return Op;
				3233
				3234	// Check to see if this is a shuffle of 4-byte values. If so, we can use our
				3235	// perfect shuffle table to emit an optimal matching sequence.
				3236	unsigned PFIndexes[4];
				3237	bool isFourElementShuffle = true;
				3238	for (unsigned i = 0; i != 4 && isFourElementShuffle; ++i) { // Element number
				3239	unsigned EltNo = 8; // Start out undef.
				3240	for (unsigned j = 0; j != 4; ++j) { // Intra-element byte.
				3241	if (PermMask.getOperand(i*4+j).getOpcode() == ISD::UNDEF)
				3242	continue; // Undef, ignore it.
				3243
				3244	unsigned ByteSource =
				3245	cast<ConstantSDNode>(PermMask.getOperand(i*4+j))->getValue();
				3246	if ((ByteSource & 3) != j) {
				3247	isFourElementShuffle = false;
				3248	break;
				3249	}
				3250
				3251	if (EltNo == 8) {
				3252	EltNo = ByteSource/4;
				3253	} else if (EltNo != ByteSource/4) {
				3254	isFourElementShuffle = false;
				3255	break;
				3256	}
				3257	}
				3258	PFIndexes[i] = EltNo;
				3259	}
				3260
				3261	// If this shuffle can be expressed as a shuffle of 4-byte elements, use the
				3262	// perfect shuffle vector to determine if it is cost effective to do this as
				3263	// discrete instructions, or whether we should use a vperm.
				3264	if (isFourElementShuffle) {
				3265	// Compute the index in the perfect shuffle table.
				3266	unsigned PFTableIndex =
				3267	PFIndexes[0]999+PFIndexes[1]99+PFIndexes[2]9+PFIndexes[3];
				3268
				3269	unsigned PFEntry = PerfectShuffleTable[PFTableIndex];
				3270	unsigned Cost = (PFEntry >> 30);
				3271
				3272	// Determining when to avoid vperm is tricky. Many things affect the cost
				3273	// of vperm, particularly how many times the perm mask needs to be computed.
				3274	// For example, if the perm mask can be hoisted out of a loop or is already
				3275	// used (perhaps because there are multiple permutes with the same shuffle
				3276	// mask?) the vperm has a cost of 1. OTOH, hoisting the permute mask out of
				3277	// the loop requires an extra register.
				3278	//
				3279	// As a compromise, we only emit discrete instructions if the shuffle can be
				3280	// generated in 3 or fewer operations. When we have loop information
				3281	// available, if this block is within a loop, we should avoid using vperm
				3282	// for 3-operation perms and use a constant pool load instead.
				3283	if (Cost < 3)
				3284	return GeneratePerfectShuffle(PFEntry, V1, V2, DAG);
				3285	}
				3286
				3287	// Lower this to a VPERM(V1, V2, V3) expression, where V3 is a constant
				3288	// vector that will get spilled to the constant pool.
				3289	if (V2.getOpcode() == ISD::UNDEF) V2 = V1;
				3290
				3291	// The SHUFFLE_VECTOR mask is almost exactly what we want for vperm, except
				3292	// that it is in input element units, not in bytes. Convert now.
				3293	MVT::ValueType EltVT = MVT::getVectorElementType(V1.getValueType());
				3294	unsigned BytesPerElement = MVT::getSizeInBits(EltVT)/8;
				3295
				3296	SmallVector<SDOperand, 16> ResultMask;
				3297	for (unsigned i = 0, e = PermMask.getNumOperands(); i != e; ++i) {
				3298	unsigned SrcElt;
				3299	if (PermMask.getOperand(i).getOpcode() == ISD::UNDEF)
				3300	SrcElt = 0;
				3301	else
				3302	SrcElt = cast<ConstantSDNode>(PermMask.getOperand(i))->getValue();
				3303
				3304	for (unsigned j = 0; j != BytesPerElement; ++j)
				3305	ResultMask.push_back(DAG.getConstant(SrcElt*BytesPerElement+j,
				3306	MVT::i8));
				3307	}
				3308
				3309	SDOperand VPermMask = DAG.getNode(ISD::BUILD_VECTOR, MVT::v16i8,
				3310	&ResultMask[0], ResultMask.size());
				3311	return DAG.getNode(PPCISD::VPERM, V1.getValueType(), V1, V2, VPermMask);
				3312	}
				3313
				3314	/// getAltivecCompareInfo - Given an intrinsic, return false if it is not an
				3315	/// altivec comparison. If it is, return true and fill in Opc/isDot with
				3316	/// information about the intrinsic.
				3317	static bool getAltivecCompareInfo(SDOperand Intrin, int &CompareOpc,
				3318	bool &isDot) {
				3319	unsigned IntrinsicID = cast<ConstantSDNode>(Intrin.getOperand(0))->getValue();
				3320	CompareOpc = -1;
				3321	isDot = false;
				3322	switch (IntrinsicID) {
				3323	default: return false;
				3324	// Comparison predicates.
				3325	case Intrinsic::ppc_altivec_vcmpbfp_p: CompareOpc = 966; isDot = 1; break;
				3326	case Intrinsic::ppc_altivec_vcmpeqfp_p: CompareOpc = 198; isDot = 1; break;
				3327	case Intrinsic::ppc_altivec_vcmpequb_p: CompareOpc = 6; isDot = 1; break;
				3328	case Intrinsic::ppc_altivec_vcmpequh_p: CompareOpc = 70; isDot = 1; break;
				3329	case Intrinsic::ppc_altivec_vcmpequw_p: CompareOpc = 134; isDot = 1; break;
				3330	case Intrinsic::ppc_altivec_vcmpgefp_p: CompareOpc = 454; isDot = 1; break;
				3331	case Intrinsic::ppc_altivec_vcmpgtfp_p: CompareOpc = 710; isDot = 1; break;
				3332	case Intrinsic::ppc_altivec_vcmpgtsb_p: CompareOpc = 774; isDot = 1; break;
				3333	case Intrinsic::ppc_altivec_vcmpgtsh_p: CompareOpc = 838; isDot = 1; break;
				3334	case Intrinsic::ppc_altivec_vcmpgtsw_p: CompareOpc = 902; isDot = 1; break;
				3335	case Intrinsic::ppc_altivec_vcmpgtub_p: CompareOpc = 518; isDot = 1; break;
				3336	case Intrinsic::ppc_altivec_vcmpgtuh_p: CompareOpc = 582; isDot = 1; break;
				3337	case Intrinsic::ppc_altivec_vcmpgtuw_p: CompareOpc = 646; isDot = 1; break;
				3338
				3339	// Normal Comparisons.
				3340	case Intrinsic::ppc_altivec_vcmpbfp: CompareOpc = 966; isDot = 0; break;
				3341	case Intrinsic::ppc_altivec_vcmpeqfp: CompareOpc = 198; isDot = 0; break;
				3342	case Intrinsic::ppc_altivec_vcmpequb: CompareOpc = 6; isDot = 0; break;
				3343	case Intrinsic::ppc_altivec_vcmpequh: CompareOpc = 70; isDot = 0; break;
				3344	case Intrinsic::ppc_altivec_vcmpequw: CompareOpc = 134; isDot = 0; break;
				3345	case Intrinsic::ppc_altivec_vcmpgefp: CompareOpc = 454; isDot = 0; break;
				3346	case Intrinsic::ppc_altivec_vcmpgtfp: CompareOpc = 710; isDot = 0; break;
				3347	case Intrinsic::ppc_altivec_vcmpgtsb: CompareOpc = 774; isDot = 0; break;
				3348	case Intrinsic::ppc_altivec_vcmpgtsh: CompareOpc = 838; isDot = 0; break;
				3349	case Intrinsic::ppc_altivec_vcmpgtsw: CompareOpc = 902; isDot = 0; break;
				3350	case Intrinsic::ppc_altivec_vcmpgtub: CompareOpc = 518; isDot = 0; break;
				3351	case Intrinsic::ppc_altivec_vcmpgtuh: CompareOpc = 582; isDot = 0; break;
				3352	case Intrinsic::ppc_altivec_vcmpgtuw: CompareOpc = 646; isDot = 0; break;
				3353	}
				3354	return true;
				3355	}
				3356
				3357	/// LowerINTRINSIC_WO_CHAIN - If this is an intrinsic that we want to custom
				3358	/// lower, do it, otherwise return null.
Dale Johannesen	8be83a7	2008-03-04 23:17:14 +0000	[diff] [blame]	3359	SDOperand PPCTargetLowering::LowerINTRINSIC_WO_CHAIN(SDOperand Op,
				3360	SelectionDAG &DAG) {
Dan Gohman	f17a25c	2007-07-18 16:29:46 +0000	[diff] [blame]	3361	// If this is a lowered altivec predicate compare, CompareOpc is set to the
				3362	// opcode number of the comparison.
				3363	int CompareOpc;
				3364	bool isDot;
				3365	if (!getAltivecCompareInfo(Op, CompareOpc, isDot))
				3366	return SDOperand(); // Don't custom lower most intrinsics.
				3367
				3368	// If this is a non-dot comparison, make the VCMP node and we are done.
				3369	if (!isDot) {
				3370	SDOperand Tmp = DAG.getNode(PPCISD::VCMP, Op.getOperand(2).getValueType(),
				3371	Op.getOperand(1), Op.getOperand(2),
				3372	DAG.getConstant(CompareOpc, MVT::i32));
				3373	return DAG.getNode(ISD::BIT_CONVERT, Op.getValueType(), Tmp);
				3374	}
				3375
				3376	// Create the PPCISD altivec 'dot' comparison node.
				3377	SDOperand Ops[] = {
				3378	Op.getOperand(2), // LHS
				3379	Op.getOperand(3), // RHS
				3380	DAG.getConstant(CompareOpc, MVT::i32)
				3381	};
				3382	std::vector<MVT::ValueType> VTs;
				3383	VTs.push_back(Op.getOperand(2).getValueType());
				3384	VTs.push_back(MVT::Flag);
				3385	SDOperand CompNode = DAG.getNode(PPCISD::VCMPo, VTs, Ops, 3);
				3386
				3387	// Now that we have the comparison, emit a copy from the CR to a GPR.
				3388	// This is flagged to the above dot comparison.
				3389	SDOperand Flags = DAG.getNode(PPCISD::MFCR, MVT::i32,
				3390	DAG.getRegister(PPC::CR6, MVT::i32),
				3391	CompNode.getValue(1));
				3392
				3393	// Unpack the result based on how the target uses it.
				3394	unsigned BitNo; // Bit # of CR6.
				3395	bool InvertBit; // Invert result?
				3396	switch (cast<ConstantSDNode>(Op.getOperand(1))->getValue()) {
				3397	default: // Can't happen, don't crash on invalid number though.
				3398	case 0: // Return the value of the EQ bit of CR6.
				3399	BitNo = 0; InvertBit = false;
				3400	break;
				3401	case 1: // Return the inverted value of the EQ bit of CR6.
				3402	BitNo = 0; InvertBit = true;
				3403	break;
				3404	case 2: // Return the value of the LT bit of CR6.
				3405	BitNo = 2; InvertBit = false;
				3406	break;
				3407	case 3: // Return the inverted value of the LT bit of CR6.
				3408	BitNo = 2; InvertBit = true;
				3409	break;
				3410	}
				3411
				3412	// Shift the bit into the low position.
				3413	Flags = DAG.getNode(ISD::SRL, MVT::i32, Flags,
				3414	DAG.getConstant(8-(3-BitNo), MVT::i32));
				3415	// Isolate the bit.
				3416	Flags = DAG.getNode(ISD::AND, MVT::i32, Flags,
				3417	DAG.getConstant(1, MVT::i32));
				3418
				3419	// If we are supposed to, toggle the bit.
				3420	if (InvertBit)
				3421	Flags = DAG.getNode(ISD::XOR, MVT::i32, Flags,
				3422	DAG.getConstant(1, MVT::i32));
				3423	return Flags;
				3424	}
				3425
Dale Johannesen	8be83a7	2008-03-04 23:17:14 +0000	[diff] [blame]	3426	SDOperand PPCTargetLowering::LowerSCALAR_TO_VECTOR(SDOperand Op,
				3427	SelectionDAG &DAG) {
Dan Gohman	f17a25c	2007-07-18 16:29:46 +0000	[diff] [blame]	3428	// Create a stack slot that is 16-byte aligned.
				3429	MachineFrameInfo *FrameInfo = DAG.getMachineFunction().getFrameInfo();
				3430	int FrameIdx = FrameInfo->CreateStackObject(16, 16);
				3431	MVT::ValueType PtrVT = DAG.getTargetLoweringInfo().getPointerTy();
				3432	SDOperand FIdx = DAG.getFrameIndex(FrameIdx, PtrVT);
				3433
				3434	// Store the input value into Value#0 of the stack slot.
				3435	SDOperand Store = DAG.getStore(DAG.getEntryNode(),
				3436	Op.getOperand(0), FIdx, NULL, 0);
				3437	// Load it out.
				3438	return DAG.getLoad(Op.getValueType(), Store, FIdx, NULL, 0);
				3439	}
				3440
Dale Johannesen	8be83a7	2008-03-04 23:17:14 +0000	[diff] [blame]	3441	SDOperand PPCTargetLowering::LowerMUL(SDOperand Op, SelectionDAG &DAG) {
Dan Gohman	f17a25c	2007-07-18 16:29:46 +0000	[diff] [blame]	3442	if (Op.getValueType() == MVT::v4i32) {
				3443	SDOperand LHS = Op.getOperand(0), RHS = Op.getOperand(1);
				3444
				3445	SDOperand Zero = BuildSplatI( 0, 1, MVT::v4i32, DAG);
				3446	SDOperand Neg16 = BuildSplatI(-16, 4, MVT::v4i32, DAG); // +16 as shift amt.
				3447
				3448	SDOperand RHSSwap = // = vrlw RHS, 16
				3449	BuildIntrinsicOp(Intrinsic::ppc_altivec_vrlw, RHS, Neg16, DAG);
				3450
				3451	// Shrinkify inputs to v8i16.
				3452	LHS = DAG.getNode(ISD::BIT_CONVERT, MVT::v8i16, LHS);
				3453	RHS = DAG.getNode(ISD::BIT_CONVERT, MVT::v8i16, RHS);
				3454	RHSSwap = DAG.getNode(ISD::BIT_CONVERT, MVT::v8i16, RHSSwap);
				3455
				3456	// Low parts multiplied together, generating 32-bit results (we ignore the
				3457	// top parts).
				3458	SDOperand LoProd = BuildIntrinsicOp(Intrinsic::ppc_altivec_vmulouh,
				3459	LHS, RHS, DAG, MVT::v4i32);
				3460
				3461	SDOperand HiProd = BuildIntrinsicOp(Intrinsic::ppc_altivec_vmsumuhm,
				3462	LHS, RHSSwap, Zero, DAG, MVT::v4i32);
				3463	// Shift the high parts up 16 bits.
				3464	HiProd = BuildIntrinsicOp(Intrinsic::ppc_altivec_vslw, HiProd, Neg16, DAG);
				3465	return DAG.getNode(ISD::ADD, MVT::v4i32, LoProd, HiProd);
				3466	} else if (Op.getValueType() == MVT::v8i16) {
				3467	SDOperand LHS = Op.getOperand(0), RHS = Op.getOperand(1);
				3468
				3469	SDOperand Zero = BuildSplatI(0, 1, MVT::v8i16, DAG);
				3470
				3471	return BuildIntrinsicOp(Intrinsic::ppc_altivec_vmladduhm,
				3472	LHS, RHS, Zero, DAG);
				3473	} else if (Op.getValueType() == MVT::v16i8) {
				3474	SDOperand LHS = Op.getOperand(0), RHS = Op.getOperand(1);
				3475
				3476	// Multiply the even 8-bit parts, producing 16-bit sums.
				3477	SDOperand EvenParts = BuildIntrinsicOp(Intrinsic::ppc_altivec_vmuleub,
				3478	LHS, RHS, DAG, MVT::v8i16);
				3479	EvenParts = DAG.getNode(ISD::BIT_CONVERT, MVT::v16i8, EvenParts);
				3480
				3481	// Multiply the odd 8-bit parts, producing 16-bit sums.
				3482	SDOperand OddParts = BuildIntrinsicOp(Intrinsic::ppc_altivec_vmuloub,
				3483	LHS, RHS, DAG, MVT::v8i16);
				3484	OddParts = DAG.getNode(ISD::BIT_CONVERT, MVT::v16i8, OddParts);
				3485
				3486	// Merge the results together.
				3487	SDOperand Ops[16];
				3488	for (unsigned i = 0; i != 8; ++i) {
				3489	Ops[i2 ] = DAG.getConstant(2i+1, MVT::i8);
				3490	Ops[i2+1] = DAG.getConstant(2i+1+16, MVT::i8);
				3491	}
				3492	return DAG.getNode(ISD::VECTOR_SHUFFLE, MVT::v16i8, EvenParts, OddParts,
				3493	DAG.getNode(ISD::BUILD_VECTOR, MVT::v16i8, Ops, 16));
				3494	} else {
				3495	assert(0 && "Unknown mul to lower!");
				3496	abort();
				3497	}
				3498	}
				3499
				3500	/// LowerOperation - Provide custom lowering hooks for some operations.
				3501	///
				3502	SDOperand PPCTargetLowering::LowerOperation(SDOperand Op, SelectionDAG &DAG) {
				3503	switch (Op.getOpcode()) {
				3504	default: assert(0 && "Wasn't expecting to be able to lower this!");
				3505	case ISD::ConstantPool: return LowerConstantPool(Op, DAG);
				3506	case ISD::GlobalAddress: return LowerGlobalAddress(Op, DAG);
				3507	case ISD::GlobalTLSAddress: return LowerGlobalTLSAddress(Op, DAG);
				3508	case ISD::JumpTable: return LowerJumpTable(Op, DAG);
				3509	case ISD::SETCC: return LowerSETCC(Op, DAG);
				3510	case ISD::VASTART:
				3511	return LowerVASTART(Op, DAG, VarArgsFrameIndex, VarArgsStackOffset,
				3512	VarArgsNumGPR, VarArgsNumFPR, PPCSubTarget);
				3513
				3514	case ISD::VAARG:
				3515	return LowerVAARG(Op, DAG, VarArgsFrameIndex, VarArgsStackOffset,
				3516	VarArgsNumGPR, VarArgsNumFPR, PPCSubTarget);
				3517
				3518	case ISD::FORMAL_ARGUMENTS:
				3519	return LowerFORMAL_ARGUMENTS(Op, DAG, VarArgsFrameIndex,
				3520	VarArgsStackOffset, VarArgsNumGPR,
				3521	VarArgsNumFPR, PPCSubTarget);
				3522
				3523	case ISD::CALL: return LowerCALL(Op, DAG, PPCSubTarget);
				3524	case ISD::RET: return LowerRET(Op, DAG, getTargetMachine());
				3525	case ISD::STACKRESTORE: return LowerSTACKRESTORE(Op, DAG, PPCSubTarget);
				3526	case ISD::DYNAMIC_STACKALLOC:
				3527	return LowerDYNAMIC_STACKALLOC(Op, DAG, PPCSubTarget);
				3528
				3529	case ISD::SELECT_CC: return LowerSELECT_CC(Op, DAG);
				3530	case ISD::FP_TO_SINT: return LowerFP_TO_SINT(Op, DAG);
				3531	case ISD::SINT_TO_FP: return LowerSINT_TO_FP(Op, DAG);
Dale Johannesen	3d8578b	2007-10-10 01:01:31 +0000	[diff] [blame]	3532	case ISD::FP_ROUND_INREG: return LowerFP_ROUND_INREG(Op, DAG);
Dan Gohman	819574c	2008-01-31 00:41:03 +0000	[diff] [blame]	3533	case ISD::FLT_ROUNDS_: return LowerFLT_ROUNDS_(Op, DAG);
Dan Gohman	f17a25c	2007-07-18 16:29:46 +0000	[diff] [blame]	3534
				3535	// Lower 64-bit shifts.
				3536	case ISD::SHL_PARTS: return LowerSHL_PARTS(Op, DAG);
				3537	case ISD::SRL_PARTS: return LowerSRL_PARTS(Op, DAG);
				3538	case ISD::SRA_PARTS: return LowerSRA_PARTS(Op, DAG);
				3539
				3540	// Vector-related lowering.
				3541	case ISD::BUILD_VECTOR: return LowerBUILD_VECTOR(Op, DAG);
				3542	case ISD::VECTOR_SHUFFLE: return LowerVECTOR_SHUFFLE(Op, DAG);
				3543	case ISD::INTRINSIC_WO_CHAIN: return LowerINTRINSIC_WO_CHAIN(Op, DAG);
				3544	case ISD::SCALAR_TO_VECTOR: return LowerSCALAR_TO_VECTOR(Op, DAG);
				3545	case ISD::MUL: return LowerMUL(Op, DAG);
				3546
Chris Lattner	f8b9337	2007-12-08 06:59:59 +0000	[diff] [blame]	3547	// Frame & Return address.
				3548	case ISD::RETURNADDR: return LowerRETURNADDR(Op, DAG);
Dan Gohman	f17a25c	2007-07-18 16:29:46 +0000	[diff] [blame]	3549	case ISD::FRAMEADDR: return LowerFRAMEADDR(Op, DAG);
				3550	}
				3551	return SDOperand();
				3552	}
				3553
Chris Lattner	2877109	2007-11-28 18:44:47 +0000	[diff] [blame]	3554	SDNode PPCTargetLowering::ExpandOperationResult(SDNode N, SelectionDAG &DAG) {
				3555	switch (N->getOpcode()) {
				3556	default: assert(0 && "Wasn't expecting to be able to lower this!");
				3557	case ISD::FP_TO_SINT: return LowerFP_TO_SINT(SDOperand(N, 0), DAG).Val;
				3558	}
				3559	}
				3560
				3561
Dan Gohman	f17a25c	2007-07-18 16:29:46 +0000	[diff] [blame]	3562	//===----------------------------------------------------------------------===//
				3563	// Other Lowering Code
				3564	//===----------------------------------------------------------------------===//
				3565
				3566	MachineBasicBlock *
Evan Cheng	e637db1	2008-01-30 18:18:23 +0000	[diff] [blame]	3567	PPCTargetLowering::EmitInstrWithCustomInserter(MachineInstr *MI,
				3568	MachineBasicBlock *BB) {
Dan Gohman	f17a25c	2007-07-18 16:29:46 +0000	[diff] [blame]	3569	const TargetInstrInfo *TII = getTargetMachine().getInstrInfo();
				3570	assert((MI->getOpcode() == PPC::SELECT_CC_I4 \|\|
				3571	MI->getOpcode() == PPC::SELECT_CC_I8 \|\|
				3572	MI->getOpcode() == PPC::SELECT_CC_F4 \|\|
				3573	MI->getOpcode() == PPC::SELECT_CC_F8 \|\|
				3574	MI->getOpcode() == PPC::SELECT_CC_VRRC) &&
				3575	"Unexpected instr type to insert");
				3576
				3577	// To "insert" a SELECT_CC instruction, we actually have to insert the diamond
				3578	// control-flow pattern. The incoming instruction knows the destination vreg
				3579	// to set, the condition code register to branch on, the true/false values to
				3580	// select between, and a branch opcode to use.
				3581	const BasicBlock *LLVM_BB = BB->getBasicBlock();
				3582	ilist<MachineBasicBlock>::iterator It = BB;
				3583	++It;
				3584
				3585	// thisMBB:
				3586	// ...
				3587	// TrueVal = ...
				3588	// cmpTY ccX, r1, r2
				3589	// bCC copy1MBB
				3590	// fallthrough --> copy0MBB
				3591	MachineBasicBlock *thisMBB = BB;
				3592	MachineBasicBlock *copy0MBB = new MachineBasicBlock(LLVM_BB);
				3593	MachineBasicBlock *sinkMBB = new MachineBasicBlock(LLVM_BB);
				3594	unsigned SelectPred = MI->getOperand(4).getImm();
				3595	BuildMI(BB, TII->get(PPC::BCC))
				3596	.addImm(SelectPred).addReg(MI->getOperand(1).getReg()).addMBB(sinkMBB);
				3597	MachineFunction *F = BB->getParent();
				3598	F->getBasicBlockList().insert(It, copy0MBB);
				3599	F->getBasicBlockList().insert(It, sinkMBB);
				3600	// Update machine-CFG edges by first adding all successors of the current
				3601	// block to the new block which will contain the Phi node for the select.
				3602	for(MachineBasicBlock::succ_iterator i = BB->succ_begin(),
				3603	e = BB->succ_end(); i != e; ++i)
				3604	sinkMBB->addSuccessor(*i);
				3605	// Next, remove all successors of the current block, and add the true
				3606	// and fallthrough blocks as its successors.
				3607	while(!BB->succ_empty())
				3608	BB->removeSuccessor(BB->succ_begin());
				3609	BB->addSuccessor(copy0MBB);
				3610	BB->addSuccessor(sinkMBB);
				3611
				3612	// copy0MBB:
				3613	// %FalseValue = ...
				3614	// # fallthrough to sinkMBB
				3615	BB = copy0MBB;
				3616
				3617	// Update machine-CFG edges
				3618	BB->addSuccessor(sinkMBB);
				3619
				3620	// sinkMBB:
				3621	// %Result = phi [ %FalseValue, copy0MBB ], [ %TrueValue, thisMBB ]
				3622	// ...
				3623	BB = sinkMBB;
				3624	BuildMI(BB, TII->get(PPC::PHI), MI->getOperand(0).getReg())
				3625	.addReg(MI->getOperand(3).getReg()).addMBB(copy0MBB)
				3626	.addReg(MI->getOperand(2).getReg()).addMBB(thisMBB);
				3627
				3628	delete MI; // The pseudo instruction is gone now.
				3629	return BB;
				3630	}
				3631
				3632	//===----------------------------------------------------------------------===//
				3633	// Target Optimization Hooks
				3634	//===----------------------------------------------------------------------===//
				3635
				3636	SDOperand PPCTargetLowering::PerformDAGCombine(SDNode *N,
				3637	DAGCombinerInfo &DCI) const {
				3638	TargetMachine &TM = getTargetMachine();
				3639	SelectionDAG &DAG = DCI.DAG;
				3640	switch (N->getOpcode()) {
				3641	default: break;
				3642	case PPCISD::SHL:
				3643	if (ConstantSDNode *C = dyn_cast<ConstantSDNode>(N->getOperand(0))) {
				3644	if (C->getValue() == 0) // 0 << V -> 0.
				3645	return N->getOperand(0);
				3646	}
				3647	break;
				3648	case PPCISD::SRL:
				3649	if (ConstantSDNode *C = dyn_cast<ConstantSDNode>(N->getOperand(0))) {
				3650	if (C->getValue() == 0) // 0 >>u V -> 0.
				3651	return N->getOperand(0);
				3652	}
				3653	break;
				3654	case PPCISD::SRA:
				3655	if (ConstantSDNode *C = dyn_cast<ConstantSDNode>(N->getOperand(0))) {
				3656	if (C->getValue() == 0 \|\| // 0 >>s V -> 0.
				3657	C->isAllOnesValue()) // -1 >>s V -> -1.
				3658	return N->getOperand(0);
				3659	}
				3660	break;
				3661
				3662	case ISD::SINT_TO_FP:
				3663	if (TM.getSubtarget<PPCSubtarget>().has64BitSupport()) {
				3664	if (N->getOperand(0).getOpcode() == ISD::FP_TO_SINT) {
				3665	// Turn (sint_to_fp (fp_to_sint X)) -> fctidz/fcfid without load/stores.
				3666	// We allow the src/dst to be either f32/f64, but the intermediate
				3667	// type must be i64.
Dale Johannesen	cbc0351	2007-10-23 23:20:14 +0000	[diff] [blame]	3668	if (N->getOperand(0).getValueType() == MVT::i64 &&
				3669	N->getOperand(0).getOperand(0).getValueType() != MVT::ppcf128) {
Dan Gohman	f17a25c	2007-07-18 16:29:46 +0000	[diff] [blame]	3670	SDOperand Val = N->getOperand(0).getOperand(0);
				3671	if (Val.getValueType() == MVT::f32) {
				3672	Val = DAG.getNode(ISD::FP_EXTEND, MVT::f64, Val);
				3673	DCI.AddToWorklist(Val.Val);
				3674	}
				3675
				3676	Val = DAG.getNode(PPCISD::FCTIDZ, MVT::f64, Val);
				3677	DCI.AddToWorklist(Val.Val);
				3678	Val = DAG.getNode(PPCISD::FCFID, MVT::f64, Val);
				3679	DCI.AddToWorklist(Val.Val);
				3680	if (N->getValueType(0) == MVT::f32) {
Chris Lattner	5872a36	2008-01-17 07:00:52 +0000	[diff] [blame]	3681	Val = DAG.getNode(ISD::FP_ROUND, MVT::f32, Val,
				3682	DAG.getIntPtrConstant(0));
Dan Gohman	f17a25c	2007-07-18 16:29:46 +0000	[diff] [blame]	3683	DCI.AddToWorklist(Val.Val);
				3684	}
				3685	return Val;
				3686	} else if (N->getOperand(0).getValueType() == MVT::i32) {
				3687	// If the intermediate type is i32, we can avoid the load/store here
				3688	// too.
				3689	}
				3690	}
				3691	}
				3692	break;
				3693	case ISD::STORE:
				3694	// Turn STORE (FP_TO_SINT F) -> STFIWX(FCTIWZ(F)).
				3695	if (TM.getSubtarget<PPCSubtarget>().hasSTFIWX() &&
Chris Lattner	df7a4ae	2008-01-18 16:54:56 +0000	[diff] [blame]	3696	!cast<StoreSDNode>(N)->isTruncatingStore() &&
Dan Gohman	f17a25c	2007-07-18 16:29:46 +0000	[diff] [blame]	3697	N->getOperand(1).getOpcode() == ISD::FP_TO_SINT &&
Dale Johannesen	cbc0351	2007-10-23 23:20:14 +0000	[diff] [blame]	3698	N->getOperand(1).getValueType() == MVT::i32 &&
				3699	N->getOperand(1).getOperand(0).getValueType() != MVT::ppcf128) {
Dan Gohman	f17a25c	2007-07-18 16:29:46 +0000	[diff] [blame]	3700	SDOperand Val = N->getOperand(1).getOperand(0);
				3701	if (Val.getValueType() == MVT::f32) {
				3702	Val = DAG.getNode(ISD::FP_EXTEND, MVT::f64, Val);
				3703	DCI.AddToWorklist(Val.Val);
				3704	}
				3705	Val = DAG.getNode(PPCISD::FCTIWZ, MVT::f64, Val);
				3706	DCI.AddToWorklist(Val.Val);
				3707
				3708	Val = DAG.getNode(PPCISD::STFIWX, MVT::Other, N->getOperand(0), Val,
				3709	N->getOperand(2), N->getOperand(3));
				3710	DCI.AddToWorklist(Val.Val);
				3711	return Val;
				3712	}
				3713
				3714	// Turn STORE (BSWAP) -> sthbrx/stwbrx.
				3715	if (N->getOperand(1).getOpcode() == ISD::BSWAP &&
				3716	N->getOperand(1).Val->hasOneUse() &&
				3717	(N->getOperand(1).getValueType() == MVT::i32 \|\|
				3718	N->getOperand(1).getValueType() == MVT::i16)) {
				3719	SDOperand BSwapOp = N->getOperand(1).getOperand(0);
				3720	// Do an any-extend to 32-bits if this is a half-word input.
				3721	if (BSwapOp.getValueType() == MVT::i16)
				3722	BSwapOp = DAG.getNode(ISD::ANY_EXTEND, MVT::i32, BSwapOp);
				3723
				3724	return DAG.getNode(PPCISD::STBRX, MVT::Other, N->getOperand(0), BSwapOp,
				3725	N->getOperand(2), N->getOperand(3),
				3726	DAG.getValueType(N->getOperand(1).getValueType()));
				3727	}
				3728	break;
				3729	case ISD::BSWAP:
				3730	// Turn BSWAP (LOAD) -> lhbrx/lwbrx.
				3731	if (ISD::isNON_EXTLoad(N->getOperand(0).Val) &&
				3732	N->getOperand(0).hasOneUse() &&
				3733	(N->getValueType(0) == MVT::i32 \|\| N->getValueType(0) == MVT::i16)) {
				3734	SDOperand Load = N->getOperand(0);
				3735	LoadSDNode *LD = cast<LoadSDNode>(Load);
				3736	// Create the byte-swapping load.
				3737	std::vector<MVT::ValueType> VTs;
				3738	VTs.push_back(MVT::i32);
				3739	VTs.push_back(MVT::Other);
Dan Gohman	12a9c08	2008-02-06 22:27:42 +0000	[diff] [blame]	3740	SDOperand MO = DAG.getMemOperand(LD->getMemOperand());
Dan Gohman	f17a25c	2007-07-18 16:29:46 +0000	[diff] [blame]	3741	SDOperand Ops[] = {
				3742	LD->getChain(), // Chain
				3743	LD->getBasePtr(), // Ptr
Dan Gohman	12a9c08	2008-02-06 22:27:42 +0000	[diff] [blame]	3744	MO, // MemOperand
Dan Gohman	f17a25c	2007-07-18 16:29:46 +0000	[diff] [blame]	3745	DAG.getValueType(N->getValueType(0)) // VT
				3746	};
				3747	SDOperand BSLoad = DAG.getNode(PPCISD::LBRX, VTs, Ops, 4);
				3748
				3749	// If this is an i16 load, insert the truncate.
				3750	SDOperand ResVal = BSLoad;
				3751	if (N->getValueType(0) == MVT::i16)
				3752	ResVal = DAG.getNode(ISD::TRUNCATE, MVT::i16, BSLoad);
				3753
				3754	// First, combine the bswap away. This makes the value produced by the
				3755	// load dead.
				3756	DCI.CombineTo(N, ResVal);
				3757
				3758	// Next, combine the load away, we give it a bogus result value but a real
				3759	// chain result. The result value is dead because the bswap is dead.
				3760	DCI.CombineTo(Load.Val, ResVal, BSLoad.getValue(1));
				3761
				3762	// Return N so it doesn't get rechecked!
				3763	return SDOperand(N, 0);
				3764	}
				3765
				3766	break;
				3767	case PPCISD::VCMP: {
				3768	// If a VCMPo node already exists with exactly the same operands as this
				3769	// node, use its result instead of this node (VCMPo computes both a CR6 and
				3770	// a normal output).
				3771	//
				3772	if (!N->getOperand(0).hasOneUse() &&
				3773	!N->getOperand(1).hasOneUse() &&
				3774	!N->getOperand(2).hasOneUse()) {
				3775
				3776	// Scan all of the users of the LHS, looking for VCMPo's that match.
				3777	SDNode *VCMPoNode = 0;
				3778
				3779	SDNode *LHSN = N->getOperand(0).Val;
				3780	for (SDNode::use_iterator UI = LHSN->use_begin(), E = LHSN->use_end();
				3781	UI != E; ++UI)
				3782	if ((*UI)->getOpcode() == PPCISD::VCMPo &&
				3783	(*UI)->getOperand(1) == N->getOperand(1) &&
				3784	(*UI)->getOperand(2) == N->getOperand(2) &&
				3785	(*UI)->getOperand(0) == N->getOperand(0)) {
				3786	VCMPoNode = *UI;
				3787	break;
				3788	}
				3789
				3790	// If there is no VCMPo node, or if the flag value has a single use, don't
				3791	// transform this.
				3792	if (!VCMPoNode \|\| VCMPoNode->hasNUsesOfValue(0, 1))
				3793	break;
				3794
				3795	// Look at the (necessarily single) use of the flag value. If it has a
				3796	// chain, this transformation is more complex. Note that multiple things
				3797	// could use the value result, which we should ignore.
				3798	SDNode *FlagUser = 0;
				3799	for (SDNode::use_iterator UI = VCMPoNode->use_begin();
				3800	FlagUser == 0; ++UI) {
				3801	assert(UI != VCMPoNode->use_end() && "Didn't find user!");
				3802	SDNode User = UI;
				3803	for (unsigned i = 0, e = User->getNumOperands(); i != e; ++i) {
				3804	if (User->getOperand(i) == SDOperand(VCMPoNode, 1)) {
				3805	FlagUser = User;
				3806	break;
				3807	}
				3808	}
				3809	}
				3810
				3811	// If the user is a MFCR instruction, we know this is safe. Otherwise we
				3812	// give up for right now.
				3813	if (FlagUser->getOpcode() == PPCISD::MFCR)
				3814	return SDOperand(VCMPoNode, 0);
				3815	}
				3816	break;
				3817	}
				3818	case ISD::BR_CC: {
				3819	// If this is a branch on an altivec predicate comparison, lower this so
				3820	// that we don't have to do a MFCR: instead, branch directly on CR6. This
				3821	// lowering is done pre-legalize, because the legalizer lowers the predicate
				3822	// compare down to code that is difficult to reassemble.
				3823	ISD::CondCode CC = cast<CondCodeSDNode>(N->getOperand(1))->get();
				3824	SDOperand LHS = N->getOperand(2), RHS = N->getOperand(3);
				3825	int CompareOpc;
				3826	bool isDot;
				3827
				3828	if (LHS.getOpcode() == ISD::INTRINSIC_WO_CHAIN &&
				3829	isa<ConstantSDNode>(RHS) && (CC == ISD::SETEQ \|\| CC == ISD::SETNE) &&
				3830	getAltivecCompareInfo(LHS, CompareOpc, isDot)) {
				3831	assert(isDot && "Can't compare against a vector result!");
				3832
				3833	// If this is a comparison against something other than 0/1, then we know
				3834	// that the condition is never/always true.
				3835	unsigned Val = cast<ConstantSDNode>(RHS)->getValue();
				3836	if (Val != 0 && Val != 1) {
				3837	if (CC == ISD::SETEQ) // Cond never true, remove branch.
				3838	return N->getOperand(0);
				3839	// Always !=, turn it into an unconditional branch.
				3840	return DAG.getNode(ISD::BR, MVT::Other,
				3841	N->getOperand(0), N->getOperand(4));
				3842	}
				3843
				3844	bool BranchOnWhenPredTrue = (CC == ISD::SETEQ) ^ (Val == 0);
				3845
				3846	// Create the PPCISD altivec 'dot' comparison node.
				3847	std::vector<MVT::ValueType> VTs;
				3848	SDOperand Ops[] = {
				3849	LHS.getOperand(2), // LHS of compare
				3850	LHS.getOperand(3), // RHS of compare
				3851	DAG.getConstant(CompareOpc, MVT::i32)
				3852	};
				3853	VTs.push_back(LHS.getOperand(2).getValueType());
				3854	VTs.push_back(MVT::Flag);
				3855	SDOperand CompNode = DAG.getNode(PPCISD::VCMPo, VTs, Ops, 3);
				3856
				3857	// Unpack the result based on how the target uses it.
				3858	PPC::Predicate CompOpc;
				3859	switch (cast<ConstantSDNode>(LHS.getOperand(1))->getValue()) {
				3860	default: // Can't happen, don't crash on invalid number though.
				3861	case 0: // Branch on the value of the EQ bit of CR6.
				3862	CompOpc = BranchOnWhenPredTrue ? PPC::PRED_EQ : PPC::PRED_NE;
				3863	break;
				3864	case 1: // Branch on the inverted value of the EQ bit of CR6.
				3865	CompOpc = BranchOnWhenPredTrue ? PPC::PRED_NE : PPC::PRED_EQ;
				3866	break;
				3867	case 2: // Branch on the value of the LT bit of CR6.
				3868	CompOpc = BranchOnWhenPredTrue ? PPC::PRED_LT : PPC::PRED_GE;
				3869	break;
				3870	case 3: // Branch on the inverted value of the LT bit of CR6.
				3871	CompOpc = BranchOnWhenPredTrue ? PPC::PRED_GE : PPC::PRED_LT;
				3872	break;
				3873	}
				3874
				3875	return DAG.getNode(PPCISD::COND_BRANCH, MVT::Other, N->getOperand(0),
				3876	DAG.getConstant(CompOpc, MVT::i32),
				3877	DAG.getRegister(PPC::CR6, MVT::i32),
				3878	N->getOperand(4), CompNode.getValue(1));
				3879	}
				3880	break;
				3881	}
				3882	}
				3883
				3884	return SDOperand();
				3885	}
				3886
				3887	//===----------------------------------------------------------------------===//
				3888	// Inline Assembly Support
				3889	//===----------------------------------------------------------------------===//
				3890
				3891	void PPCTargetLowering::computeMaskedBitsForTargetNode(const SDOperand Op,
Dan Gohman	d0dfc77	2008-02-13 22:28:48 +0000	[diff] [blame]	3892	const APInt &Mask,
Dan Gohman	229fa05	2008-02-13 00:35:47 +0000	[diff] [blame]	3893	APInt &KnownZero,
				3894	APInt &KnownOne,
Dan Gohman	f17a25c	2007-07-18 16:29:46 +0000	[diff] [blame]	3895	const SelectionDAG &DAG,
				3896	unsigned Depth) const {
Dan Gohman	229fa05	2008-02-13 00:35:47 +0000	[diff] [blame]	3897	KnownZero = KnownOne = APInt(Mask.getBitWidth(), 0);
Dan Gohman	f17a25c	2007-07-18 16:29:46 +0000	[diff] [blame]	3898	switch (Op.getOpcode()) {
				3899	default: break;
				3900	case PPCISD::LBRX: {
				3901	// lhbrx is known to have the top bits cleared out.
				3902	if (cast<VTSDNode>(Op.getOperand(3))->getVT() == MVT::i16)
				3903	KnownZero = 0xFFFF0000;
				3904	break;
				3905	}
				3906	case ISD::INTRINSIC_WO_CHAIN: {
				3907	switch (cast<ConstantSDNode>(Op.getOperand(0))->getValue()) {
				3908	default: break;
				3909	case Intrinsic::ppc_altivec_vcmpbfp_p:
				3910	case Intrinsic::ppc_altivec_vcmpeqfp_p:
				3911	case Intrinsic::ppc_altivec_vcmpequb_p:
				3912	case Intrinsic::ppc_altivec_vcmpequh_p:
				3913	case Intrinsic::ppc_altivec_vcmpequw_p:
				3914	case Intrinsic::ppc_altivec_vcmpgefp_p:
				3915	case Intrinsic::ppc_altivec_vcmpgtfp_p:
				3916	case Intrinsic::ppc_altivec_vcmpgtsb_p:
				3917	case Intrinsic::ppc_altivec_vcmpgtsh_p:
				3918	case Intrinsic::ppc_altivec_vcmpgtsw_p:
				3919	case Intrinsic::ppc_altivec_vcmpgtub_p:
				3920	case Intrinsic::ppc_altivec_vcmpgtuh_p:
				3921	case Intrinsic::ppc_altivec_vcmpgtuw_p:
				3922	KnownZero = ~1U; // All bits but the low one are known to be zero.
				3923	break;
				3924	}
				3925	}
				3926	}
				3927	}
				3928
				3929
				3930	/// getConstraintType - Given a constraint, return the type of
				3931	/// constraint it is for this target.
				3932	PPCTargetLowering::ConstraintType
				3933	PPCTargetLowering::getConstraintType(const std::string &Constraint) const {
				3934	if (Constraint.size() == 1) {
				3935	switch (Constraint[0]) {
				3936	default: break;
				3937	case 'b':
				3938	case 'r':
				3939	case 'f':
				3940	case 'v':
				3941	case 'y':
				3942	return C_RegisterClass;
				3943	}
				3944	}
				3945	return TargetLowering::getConstraintType(Constraint);
				3946	}
				3947
				3948	std::pair<unsigned, const TargetRegisterClass*>
				3949	PPCTargetLowering::getRegForInlineAsmConstraint(const std::string &Constraint,
				3950	MVT::ValueType VT) const {
				3951	if (Constraint.size() == 1) {
				3952	// GCC RS6000 Constraint Letters
				3953	switch (Constraint[0]) {
				3954	case 'b': // R1-R31
				3955	case 'r': // R0-R31
				3956	if (VT == MVT::i64 && PPCSubTarget.isPPC64())
				3957	return std::make_pair(0U, PPC::G8RCRegisterClass);
				3958	return std::make_pair(0U, PPC::GPRCRegisterClass);
				3959	case 'f':
				3960	if (VT == MVT::f32)
				3961	return std::make_pair(0U, PPC::F4RCRegisterClass);
				3962	else if (VT == MVT::f64)
				3963	return std::make_pair(0U, PPC::F8RCRegisterClass);
				3964	break;
				3965	case 'v':
				3966	return std::make_pair(0U, PPC::VRRCRegisterClass);
				3967	case 'y': // crrc
				3968	return std::make_pair(0U, PPC::CRRCRegisterClass);
				3969	}
				3970	}
				3971
				3972	return TargetLowering::getRegForInlineAsmConstraint(Constraint, VT);
				3973	}
				3974
				3975
Chris Lattner	a531abc	2007-08-25 00:47:38 +0000	[diff] [blame]	3976	/// LowerAsmOperandForConstraint - Lower the specified operand into the Ops
				3977	/// vector. If it is invalid, don't add anything to Ops.
				3978	void PPCTargetLowering::LowerAsmOperandForConstraint(SDOperand Op, char Letter,
				3979	std::vector<SDOperand>&Ops,
				3980	SelectionDAG &DAG) {
				3981	SDOperand Result(0,0);
Dan Gohman	f17a25c	2007-07-18 16:29:46 +0000	[diff] [blame]	3982	switch (Letter) {
				3983	default: break;
				3984	case 'I':
				3985	case 'J':
				3986	case 'K':
				3987	case 'L':
				3988	case 'M':
				3989	case 'N':
				3990	case 'O':
				3991	case 'P': {
				3992	ConstantSDNode *CST = dyn_cast<ConstantSDNode>(Op);
Chris Lattner	a531abc	2007-08-25 00:47:38 +0000	[diff] [blame]	3993	if (!CST) return; // Must be an immediate to match.
Dan Gohman	f17a25c	2007-07-18 16:29:46 +0000	[diff] [blame]	3994	unsigned Value = CST->getValue();
				3995	switch (Letter) {
				3996	default: assert(0 && "Unknown constraint letter!");
				3997	case 'I': // "I" is a signed 16-bit constant.
				3998	if ((short)Value == (int)Value)
Chris Lattner	a531abc	2007-08-25 00:47:38 +0000	[diff] [blame]	3999	Result = DAG.getTargetConstant(Value, Op.getValueType());
Dan Gohman	f17a25c	2007-07-18 16:29:46 +0000	[diff] [blame]	4000	break;
				4001	case 'J': // "J" is a constant with only the high-order 16 bits nonzero.
				4002	case 'L': // "L" is a signed 16-bit constant shifted left 16 bits.
				4003	if ((short)Value == 0)
Chris Lattner	a531abc	2007-08-25 00:47:38 +0000	[diff] [blame]	4004	Result = DAG.getTargetConstant(Value, Op.getValueType());
Dan Gohman	f17a25c	2007-07-18 16:29:46 +0000	[diff] [blame]	4005	break;
				4006	case 'K': // "K" is a constant with only the low-order 16 bits nonzero.
				4007	if ((Value >> 16) == 0)
Chris Lattner	a531abc	2007-08-25 00:47:38 +0000	[diff] [blame]	4008	Result = DAG.getTargetConstant(Value, Op.getValueType());
Dan Gohman	f17a25c	2007-07-18 16:29:46 +0000	[diff] [blame]	4009	break;
				4010	case 'M': // "M" is a constant that is greater than 31.
				4011	if (Value > 31)
Chris Lattner	a531abc	2007-08-25 00:47:38 +0000	[diff] [blame]	4012	Result = DAG.getTargetConstant(Value, Op.getValueType());
Dan Gohman	f17a25c	2007-07-18 16:29:46 +0000	[diff] [blame]	4013	break;
				4014	case 'N': // "N" is a positive constant that is an exact power of two.
				4015	if ((int)Value > 0 && isPowerOf2_32(Value))
Chris Lattner	a531abc	2007-08-25 00:47:38 +0000	[diff] [blame]	4016	Result = DAG.getTargetConstant(Value, Op.getValueType());
Dan Gohman	f17a25c	2007-07-18 16:29:46 +0000	[diff] [blame]	4017	break;
				4018	case 'O': // "O" is the constant zero.
				4019	if (Value == 0)
Chris Lattner	a531abc	2007-08-25 00:47:38 +0000	[diff] [blame]	4020	Result = DAG.getTargetConstant(Value, Op.getValueType());
Dan Gohman	f17a25c	2007-07-18 16:29:46 +0000	[diff] [blame]	4021	break;
				4022	case 'P': // "P" is a constant whose negation is a signed 16-bit constant.
				4023	if ((short)-Value == (int)-Value)
Chris Lattner	a531abc	2007-08-25 00:47:38 +0000	[diff] [blame]	4024	Result = DAG.getTargetConstant(Value, Op.getValueType());
Dan Gohman	f17a25c	2007-07-18 16:29:46 +0000	[diff] [blame]	4025	break;
				4026	}
				4027	break;
				4028	}
				4029	}
				4030
Chris Lattner	a531abc	2007-08-25 00:47:38 +0000	[diff] [blame]	4031	if (Result.Val) {
				4032	Ops.push_back(Result);
				4033	return;
				4034	}
				4035
Dan Gohman	f17a25c	2007-07-18 16:29:46 +0000	[diff] [blame]	4036	// Handle standard constraint letters.
Chris Lattner	a531abc	2007-08-25 00:47:38 +0000	[diff] [blame]	4037	TargetLowering::LowerAsmOperandForConstraint(Op, Letter, Ops, DAG);
Dan Gohman	f17a25c	2007-07-18 16:29:46 +0000	[diff] [blame]	4038	}
				4039
				4040	// isLegalAddressingMode - Return true if the addressing mode represented
				4041	// by AM is legal for this target, for a load/store of the specified type.
				4042	bool PPCTargetLowering::isLegalAddressingMode(const AddrMode &AM,
				4043	const Type *Ty) const {
				4044	// FIXME: PPC does not allow r+i addressing modes for vectors!
				4045
				4046	// PPC allows a sign-extended 16-bit immediate field.
				4047	if (AM.BaseOffs <= -(1LL << 16) \|\| AM.BaseOffs >= (1LL << 16)-1)
				4048	return false;
				4049
				4050	// No global is ever allowed as a base.
				4051	if (AM.BaseGV)
				4052	return false;
				4053
				4054	// PPC only support r+r,
				4055	switch (AM.Scale) {
				4056	case 0: // "r+i" or just "i", depending on HasBaseReg.
				4057	break;
				4058	case 1:
				4059	if (AM.HasBaseReg && AM.BaseOffs) // "r+r+i" is not allowed.
				4060	return false;
				4061	// Otherwise we have r+r or r+i.
				4062	break;
				4063	case 2:
				4064	if (AM.HasBaseReg \|\| AM.BaseOffs) // 2r+r or 2r+i is not allowed.
				4065	return false;
				4066	// Allow 2*r as r+r.
				4067	break;
				4068	default:
				4069	// No other scales are supported.
				4070	return false;
				4071	}
				4072
				4073	return true;
				4074	}
				4075
				4076	/// isLegalAddressImmediate - Return true if the integer value can be used
				4077	/// as the offset of the target addressing mode for load / store of the
				4078	/// given type.
				4079	bool PPCTargetLowering::isLegalAddressImmediate(int64_t V,const Type *Ty) const{
				4080	// PPC allows a sign-extended 16-bit immediate field.
				4081	return (V > -(1 << 16) && V < (1 << 16)-1);
				4082	}
				4083
				4084	bool PPCTargetLowering::isLegalAddressImmediate(llvm::GlobalValue* GV) const {
				4085	return false;
				4086	}
				4087
Chris Lattner	f8b9337	2007-12-08 06:59:59 +0000	[diff] [blame]	4088	SDOperand PPCTargetLowering::LowerRETURNADDR(SDOperand Op, SelectionDAG &DAG) {
				4089	// Depths > 0 not supported yet!
				4090	if (cast<ConstantSDNode>(Op.getOperand(0))->getValue() > 0)
				4091	return SDOperand();
				4092
				4093	MachineFunction &MF = DAG.getMachineFunction();
				4094	PPCFunctionInfo *FuncInfo = MF.getInfo<PPCFunctionInfo>();
				4095	int RAIdx = FuncInfo->getReturnAddrSaveIndex();
				4096	if (RAIdx == 0) {
				4097	bool isPPC64 = PPCSubTarget.isPPC64();
				4098	int Offset =
				4099	PPCFrameInfo::getReturnSaveOffset(isPPC64, PPCSubTarget.isMachoABI());
				4100
				4101	// Set up a frame object for the return address.
				4102	RAIdx = MF.getFrameInfo()->CreateFixedObject(isPPC64 ? 8 : 4, Offset);
				4103
				4104	// Remember it for next time.
				4105	FuncInfo->setReturnAddrSaveIndex(RAIdx);
				4106
				4107	// Make sure the function really does not optimize away the store of the RA
				4108	// to the stack.
				4109	FuncInfo->setLRStoreRequired();
				4110	}
				4111
				4112	// Just load the return address off the stack.
				4113	SDOperand RetAddrFI = DAG.getFrameIndex(RAIdx, getPointerTy());
				4114	return DAG.getLoad(getPointerTy(), DAG.getEntryNode(), RetAddrFI, NULL, 0);
				4115	}
				4116
				4117	SDOperand PPCTargetLowering::LowerFRAMEADDR(SDOperand Op, SelectionDAG &DAG) {
Dan Gohman	f17a25c	2007-07-18 16:29:46 +0000	[diff] [blame]	4118	// Depths > 0 not supported yet!
				4119	if (cast<ConstantSDNode>(Op.getOperand(0))->getValue() > 0)
				4120	return SDOperand();
				4121
				4122	MVT::ValueType PtrVT = DAG.getTargetLoweringInfo().getPointerTy();
				4123	bool isPPC64 = PtrVT == MVT::i64;
				4124
				4125	MachineFunction &MF = DAG.getMachineFunction();
				4126	MachineFrameInfo *MFI = MF.getFrameInfo();
				4127	bool is31 = (NoFramePointerElim \|\| MFI->hasVarSizedObjects())
				4128	&& MFI->getStackSize();
				4129
				4130	if (isPPC64)
				4131	return DAG.getCopyFromReg(DAG.getEntryNode(), is31 ? PPC::X31 : PPC::X1,
Bill Wendling	5e28ab1	2007-08-30 00:59:19 +0000	[diff] [blame]	4132	MVT::i64);
Dan Gohman	f17a25c	2007-07-18 16:29:46 +0000	[diff] [blame]	4133	else
				4134	return DAG.getCopyFromReg(DAG.getEntryNode(), is31 ? PPC::R31 : PPC::R1,
				4135	MVT::i32);
				4136	}