Blame - lib/CodeGen/SelectionDAG/SelectionDAGBuild.cpp - platform/external/llvm

blob: 853e0549f75db15d8b1f46389bb7ac070109f60c [file] [log] [blame]

Dan Gohman	f0cbcd4	2008-09-03 16:12:24 +0000	[diff] [blame]	1	//===-- SelectionDAGBuild.cpp - Selection-DAG building --------------------===//
				2	//
				3	// The LLVM Compiler Infrastructure
				4	//
				5	// This file is distributed under the University of Illinois Open Source
				6	// License. See LICENSE.TXT for details.
				7	//
				8	//===----------------------------------------------------------------------===//
				9	//
				10	// This implements routines for translating from LLVM IR into SelectionDAG IR.
				11	//
				12	//===----------------------------------------------------------------------===//
				13
				14	#define DEBUG_TYPE "isel"
				15	#include "SelectionDAGBuild.h"
				16	#include "llvm/ADT/BitVector.h"
Dan Gohman	5b22980	2008-09-04 20:49:27 +0000	[diff] [blame]	17	#include "llvm/ADT/SmallSet.h"
Dan Gohman	f0cbcd4	2008-09-03 16:12:24 +0000	[diff] [blame]	18	#include "llvm/Analysis/AliasAnalysis.h"
				19	#include "llvm/Constants.h"
				20	#include "llvm/CallingConv.h"
				21	#include "llvm/DerivedTypes.h"
				22	#include "llvm/Function.h"
				23	#include "llvm/GlobalVariable.h"
				24	#include "llvm/InlineAsm.h"
				25	#include "llvm/Instructions.h"
				26	#include "llvm/Intrinsics.h"
				27	#include "llvm/IntrinsicInst.h"
Bill Wendling	b2a4298	2008-11-06 02:29:10 +0000	[diff] [blame]	28	#include "llvm/Module.h"
Dan Gohman	f0cbcd4	2008-09-03 16:12:24 +0000	[diff] [blame]	29	#include "llvm/CodeGen/FastISel.h"
				30	#include "llvm/CodeGen/GCStrategy.h"
				31	#include "llvm/CodeGen/GCMetadata.h"
				32	#include "llvm/CodeGen/MachineFunction.h"
				33	#include "llvm/CodeGen/MachineFrameInfo.h"
				34	#include "llvm/CodeGen/MachineInstrBuilder.h"
				35	#include "llvm/CodeGen/MachineJumpTableInfo.h"
				36	#include "llvm/CodeGen/MachineModuleInfo.h"
				37	#include "llvm/CodeGen/MachineRegisterInfo.h"
Bill Wendling	b2a4298	2008-11-06 02:29:10 +0000	[diff] [blame]	38	#include "llvm/CodeGen/PseudoSourceValue.h"
Dan Gohman	f0cbcd4	2008-09-03 16:12:24 +0000	[diff] [blame]	39	#include "llvm/CodeGen/SelectionDAG.h"
				40	#include "llvm/Target/TargetRegisterInfo.h"
				41	#include "llvm/Target/TargetData.h"
				42	#include "llvm/Target/TargetFrameInfo.h"
				43	#include "llvm/Target/TargetInstrInfo.h"
				44	#include "llvm/Target/TargetLowering.h"
				45	#include "llvm/Target/TargetMachine.h"
				46	#include "llvm/Target/TargetOptions.h"
				47	#include "llvm/Support/Compiler.h"
				48	#include "llvm/Support/Debug.h"
				49	#include "llvm/Support/MathExtras.h"
				50	#include <algorithm>
				51	using namespace llvm;
				52
Dale Johannesen	601d3c0	2008-09-05 01:48:15 +0000	[diff] [blame]	53	/// LimitFloatPrecision - Generate low-precision inline sequences for
				54	/// some float libcalls (6, 8 or 12 bits).
				55	static unsigned LimitFloatPrecision;
				56
				57	static cl::opt<unsigned, true>
				58	LimitFPPrecision("limit-float-precision",
				59	cl::desc("Generate low-precision inline sequences "
				60	"for some float libcalls"),
				61	cl::location(LimitFloatPrecision),
				62	cl::init(0));
				63
Dan Gohman	f0cbcd4	2008-09-03 16:12:24 +0000	[diff] [blame]	64	/// ComputeLinearIndex - Given an LLVM IR aggregate type and a sequence
				65	/// insertvalue or extractvalue indices that identify a member, return
				66	/// the linearized index of the start of the member.
				67	///
				68	static unsigned ComputeLinearIndex(const TargetLowering &TLI, const Type *Ty,
				69	const unsigned *Indices,
				70	const unsigned *IndicesEnd,
				71	unsigned CurIndex = 0) {
				72	// Base case: We're done.
				73	if (Indices && Indices == IndicesEnd)
				74	return CurIndex;
				75
				76	// Given a struct type, recursively traverse the elements.
				77	if (const StructType *STy = dyn_cast<StructType>(Ty)) {
				78	for (StructType::element_iterator EB = STy->element_begin(),
				79	EI = EB,
				80	EE = STy->element_end();
				81	EI != EE; ++EI) {
				82	if (Indices && *Indices == unsigned(EI - EB))
				83	return ComputeLinearIndex(TLI, *EI, Indices+1, IndicesEnd, CurIndex);
				84	CurIndex = ComputeLinearIndex(TLI, *EI, 0, 0, CurIndex);
				85	}
				86	}
				87	// Given an array type, recursively traverse the elements.
				88	else if (const ArrayType *ATy = dyn_cast<ArrayType>(Ty)) {
				89	const Type *EltTy = ATy->getElementType();
				90	for (unsigned i = 0, e = ATy->getNumElements(); i != e; ++i) {
				91	if (Indices && *Indices == i)
				92	return ComputeLinearIndex(TLI, EltTy, Indices+1, IndicesEnd, CurIndex);
				93	CurIndex = ComputeLinearIndex(TLI, EltTy, 0, 0, CurIndex);
				94	}
				95	}
				96	// We haven't found the type we're looking for, so keep searching.
				97	return CurIndex + 1;
				98	}
				99
				100	/// ComputeValueVTs - Given an LLVM IR type, compute a sequence of
				101	/// MVTs that represent all the individual underlying
				102	/// non-aggregate types that comprise it.
				103	///
				104	/// If Offsets is non-null, it points to a vector to be filled in
				105	/// with the in-memory offsets of each of the individual values.
				106	///
				107	static void ComputeValueVTs(const TargetLowering &TLI, const Type *Ty,
				108	SmallVectorImpl<MVT> &ValueVTs,
				109	SmallVectorImpl<uint64_t> *Offsets = 0,
				110	uint64_t StartingOffset = 0) {
				111	// Given a struct type, recursively traverse the elements.
				112	if (const StructType *STy = dyn_cast<StructType>(Ty)) {
				113	const StructLayout *SL = TLI.getTargetData()->getStructLayout(STy);
				114	for (StructType::element_iterator EB = STy->element_begin(),
				115	EI = EB,
				116	EE = STy->element_end();
				117	EI != EE; ++EI)
				118	ComputeValueVTs(TLI, *EI, ValueVTs, Offsets,
				119	StartingOffset + SL->getElementOffset(EI - EB));
				120	return;
				121	}
				122	// Given an array type, recursively traverse the elements.
				123	if (const ArrayType *ATy = dyn_cast<ArrayType>(Ty)) {
				124	const Type *EltTy = ATy->getElementType();
				125	uint64_t EltSize = TLI.getTargetData()->getABITypeSize(EltTy);
				126	for (unsigned i = 0, e = ATy->getNumElements(); i != e; ++i)
				127	ComputeValueVTs(TLI, EltTy, ValueVTs, Offsets,
				128	StartingOffset + i * EltSize);
				129	return;
				130	}
				131	// Base case: we can get an MVT for this LLVM IR type.
				132	ValueVTs.push_back(TLI.getValueType(Ty));
				133	if (Offsets)
				134	Offsets->push_back(StartingOffset);
				135	}
				136
Dan Gohman	2a7c671	2008-09-03 23:18:39 +0000	[diff] [blame]	137	namespace llvm {
Dan Gohman	f0cbcd4	2008-09-03 16:12:24 +0000	[diff] [blame]	138	/// RegsForValue - This struct represents the registers (physical or virtual)
				139	/// that a particular set of values is assigned, and the type information about
				140	/// the value. The most common situation is to represent one value at a time,
				141	/// but struct or array values are handled element-wise as multiple values.
				142	/// The splitting of aggregates is performed recursively, so that we never
				143	/// have aggregate-typed registers. The values at this point do not necessarily
				144	/// have legal types, so each value may require one or more registers of some
				145	/// legal type.
				146	///
				147	struct VISIBILITY_HIDDEN RegsForValue {
				148	/// TLI - The TargetLowering object.
				149	///
				150	const TargetLowering *TLI;
				151
				152	/// ValueVTs - The value types of the values, which may not be legal, and
				153	/// may need be promoted or synthesized from one or more registers.
				154	///
				155	SmallVector<MVT, 4> ValueVTs;
				156
				157	/// RegVTs - The value types of the registers. This is the same size as
				158	/// ValueVTs and it records, for each value, what the type of the assigned
				159	/// register or registers are. (Individual values are never synthesized
				160	/// from more than one type of register.)
				161	///
				162	/// With virtual registers, the contents of RegVTs is redundant with TLI's
				163	/// getRegisterType member function, however when with physical registers
				164	/// it is necessary to have a separate record of the types.
				165	///
				166	SmallVector<MVT, 4> RegVTs;
				167
				168	/// Regs - This list holds the registers assigned to the values.
				169	/// Each legal or promoted value requires one register, and each
				170	/// expanded value requires multiple registers.
				171	///
				172	SmallVector<unsigned, 4> Regs;
				173
				174	RegsForValue() : TLI(0) {}
				175
				176	RegsForValue(const TargetLowering &tli,
				177	const SmallVector<unsigned, 4> &regs,
				178	MVT regvt, MVT valuevt)
				179	: TLI(&tli), ValueVTs(1, valuevt), RegVTs(1, regvt), Regs(regs) {}
				180	RegsForValue(const TargetLowering &tli,
				181	const SmallVector<unsigned, 4> &regs,
				182	const SmallVector<MVT, 4> &regvts,
				183	const SmallVector<MVT, 4> &valuevts)
				184	: TLI(&tli), ValueVTs(valuevts), RegVTs(regvts), Regs(regs) {}
				185	RegsForValue(const TargetLowering &tli,
				186	unsigned Reg, const Type *Ty) : TLI(&tli) {
				187	ComputeValueVTs(tli, Ty, ValueVTs);
				188
				189	for (unsigned Value = 0, e = ValueVTs.size(); Value != e; ++Value) {
				190	MVT ValueVT = ValueVTs[Value];
				191	unsigned NumRegs = TLI->getNumRegisters(ValueVT);
				192	MVT RegisterVT = TLI->getRegisterType(ValueVT);
				193	for (unsigned i = 0; i != NumRegs; ++i)
				194	Regs.push_back(Reg + i);
				195	RegVTs.push_back(RegisterVT);
				196	Reg += NumRegs;
				197	}
				198	}
				199
				200	/// append - Add the specified values to this one.
				201	void append(const RegsForValue &RHS) {
				202	TLI = RHS.TLI;
				203	ValueVTs.append(RHS.ValueVTs.begin(), RHS.ValueVTs.end());
				204	RegVTs.append(RHS.RegVTs.begin(), RHS.RegVTs.end());
				205	Regs.append(RHS.Regs.begin(), RHS.Regs.end());
				206	}
				207
				208
				209	/// getCopyFromRegs - Emit a series of CopyFromReg nodes that copies from
				210	/// this value and returns the result as a ValueVTs value. This uses
				211	/// Chain/Flag as the input and updates them for the output Chain/Flag.
				212	/// If the Flag pointer is NULL, no flag is used.
				213	SDValue getCopyFromRegs(SelectionDAG &DAG,
				214	SDValue &Chain, SDValue *Flag) const;
				215
				216	/// getCopyToRegs - Emit a series of CopyToReg nodes that copies the
				217	/// specified value into the registers specified by this object. This uses
				218	/// Chain/Flag as the input and updates them for the output Chain/Flag.
				219	/// If the Flag pointer is NULL, no flag is used.
				220	void getCopyToRegs(SDValue Val, SelectionDAG &DAG,
				221	SDValue &Chain, SDValue *Flag) const;
				222
				223	/// AddInlineAsmOperands - Add this value to the specified inlineasm node
				224	/// operand list. This adds the code marker and includes the number of
				225	/// values added into it.
				226	void AddInlineAsmOperands(unsigned Code, SelectionDAG &DAG,
				227	std::vector<SDValue> &Ops) const;
				228	};
				229	}
				230
				231	/// isUsedOutsideOfDefiningBlock - Return true if this instruction is used by
				232	/// PHI nodes or outside of the basic block that defines it, or used by a
				233	/// switch or atomic instruction, which may expand to multiple basic blocks.
				234	static bool isUsedOutsideOfDefiningBlock(Instruction *I) {
				235	if (isa<PHINode>(I)) return true;
				236	BasicBlock *BB = I->getParent();
				237	for (Value::use_iterator UI = I->use_begin(), E = I->use_end(); UI != E; ++UI)
				238	if (cast<Instruction>(UI)->getParent() != BB \|\| isa<PHINode>(UI) \|\|
				239	// FIXME: Remove switchinst special case.
				240	isa<SwitchInst>(*UI))
				241	return true;
				242	return false;
				243	}
				244
				245	/// isOnlyUsedInEntryBlock - If the specified argument is only used in the
				246	/// entry block, return true. This includes arguments used by switches, since
				247	/// the switch may expand into multiple basic blocks.
				248	static bool isOnlyUsedInEntryBlock(Argument *A, bool EnableFastISel) {
				249	// With FastISel active, we may be splitting blocks, so force creation
				250	// of virtual registers for all non-dead arguments.
Dan Gohman	33134c4	2008-09-25 17:05:24 +0000	[diff] [blame]	251	// Don't force virtual registers for byval arguments though, because
				252	// fast-isel can't handle those in all cases.
				253	if (EnableFastISel && !A->hasByValAttr())
Dan Gohman	f0cbcd4	2008-09-03 16:12:24 +0000	[diff] [blame]	254	return A->use_empty();
				255
				256	BasicBlock *Entry = A->getParent()->begin();
				257	for (Value::use_iterator UI = A->use_begin(), E = A->use_end(); UI != E; ++UI)
				258	if (cast<Instruction>(UI)->getParent() != Entry \|\| isa<SwitchInst>(UI))
				259	return false; // Use not in entry block.
				260	return true;
				261	}
				262
				263	FunctionLoweringInfo::FunctionLoweringInfo(TargetLowering &tli)
				264	: TLI(tli) {
				265	}
				266
				267	void FunctionLoweringInfo::set(Function &fn, MachineFunction &mf,
				268	bool EnableFastISel) {
				269	Fn = &fn;
				270	MF = &mf;
				271	RegInfo = &MF->getRegInfo();
				272
				273	// Create a vreg for each argument register that is not dead and is used
				274	// outside of the entry block for the function.
				275	for (Function::arg_iterator AI = Fn->arg_begin(), E = Fn->arg_end();
				276	AI != E; ++AI)
				277	if (!isOnlyUsedInEntryBlock(AI, EnableFastISel))
				278	InitializeRegForValue(AI);
				279
				280	// Initialize the mapping of values to registers. This is only set up for
				281	// instruction values that are used outside of the block that defines
				282	// them.
				283	Function::iterator BB = Fn->begin(), EB = Fn->end();
				284	for (BasicBlock::iterator I = BB->begin(), E = BB->end(); I != E; ++I)
				285	if (AllocaInst *AI = dyn_cast<AllocaInst>(I))
				286	if (ConstantInt *CUI = dyn_cast<ConstantInt>(AI->getArraySize())) {
				287	const Type *Ty = AI->getAllocatedType();
				288	uint64_t TySize = TLI.getTargetData()->getABITypeSize(Ty);
				289	unsigned Align =
				290	std::max((unsigned)TLI.getTargetData()->getPrefTypeAlignment(Ty),
				291	AI->getAlignment());
				292
				293	TySize *= CUI->getZExtValue(); // Get total allocated size.
				294	if (TySize == 0) TySize = 1; // Don't create zero-sized stack objects.
				295	StaticAllocaMap[AI] =
				296	MF->getFrameInfo()->CreateStackObject(TySize, Align);
				297	}
				298
				299	for (; BB != EB; ++BB)
				300	for (BasicBlock::iterator I = BB->begin(), E = BB->end(); I != E; ++I)
				301	if (!I->use_empty() && isUsedOutsideOfDefiningBlock(I))
				302	if (!isa<AllocaInst>(I) \|\|
				303	!StaticAllocaMap.count(cast<AllocaInst>(I)))
				304	InitializeRegForValue(I);
				305
				306	// Create an initial MachineBasicBlock for each LLVM BasicBlock in F. This
				307	// also creates the initial PHI MachineInstrs, though none of the input
				308	// operands are populated.
				309	for (BB = Fn->begin(), EB = Fn->end(); BB != EB; ++BB) {
				310	MachineBasicBlock *MBB = mf.CreateMachineBasicBlock(BB);
				311	MBBMap[BB] = MBB;
				312	MF->push_back(MBB);
				313
				314	// Create Machine PHI nodes for LLVM PHI nodes, lowering them as
				315	// appropriate.
				316	PHINode *PN;
				317	for (BasicBlock::iterator I = BB->begin();(PN = dyn_cast<PHINode>(I)); ++I){
				318	if (PN->use_empty()) continue;
				319
				320	unsigned PHIReg = ValueMap[PN];
				321	assert(PHIReg && "PHI node does not have an assigned virtual register!");
				322
				323	SmallVector<MVT, 4> ValueVTs;
				324	ComputeValueVTs(TLI, PN->getType(), ValueVTs);
				325	for (unsigned vti = 0, vte = ValueVTs.size(); vti != vte; ++vti) {
				326	MVT VT = ValueVTs[vti];
				327	unsigned NumRegisters = TLI.getNumRegisters(VT);
Dan Gohman	6448d91	2008-09-04 15:39:15 +0000	[diff] [blame]	328	const TargetInstrInfo *TII = MF->getTarget().getInstrInfo();
Dan Gohman	f0cbcd4	2008-09-03 16:12:24 +0000	[diff] [blame]	329	for (unsigned i = 0; i != NumRegisters; ++i)
				330	BuildMI(MBB, TII->get(TargetInstrInfo::PHI), PHIReg+i);
				331	PHIReg += NumRegisters;
				332	}
				333	}
				334	}
				335	}
				336
				337	unsigned FunctionLoweringInfo::MakeReg(MVT VT) {
				338	return RegInfo->createVirtualRegister(TLI.getRegClassFor(VT));
				339	}
				340
				341	/// CreateRegForValue - Allocate the appropriate number of virtual registers of
				342	/// the correctly promoted or expanded types. Assign these registers
				343	/// consecutive vreg numbers and return the first assigned number.
				344	///
				345	/// In the case that the given value has struct or array type, this function
				346	/// will assign registers for each member or element.
				347	///
				348	unsigned FunctionLoweringInfo::CreateRegForValue(const Value *V) {
				349	SmallVector<MVT, 4> ValueVTs;
				350	ComputeValueVTs(TLI, V->getType(), ValueVTs);
				351
				352	unsigned FirstReg = 0;
				353	for (unsigned Value = 0, e = ValueVTs.size(); Value != e; ++Value) {
				354	MVT ValueVT = ValueVTs[Value];
				355	MVT RegisterVT = TLI.getRegisterType(ValueVT);
				356
				357	unsigned NumRegs = TLI.getNumRegisters(ValueVT);
				358	for (unsigned i = 0; i != NumRegs; ++i) {
				359	unsigned R = MakeReg(RegisterVT);
				360	if (!FirstReg) FirstReg = R;
				361	}
				362	}
				363	return FirstReg;
				364	}
				365
				366	/// getCopyFromParts - Create a value that contains the specified legal parts
				367	/// combined into the value they represent. If the parts combine to a type
				368	/// larger then ValueVT then AssertOp can be used to specify whether the extra
				369	/// bits are known to be zero (ISD::AssertZext) or sign extended from ValueVT
				370	/// (ISD::AssertSext).
				371	static SDValue getCopyFromParts(SelectionDAG &DAG,
				372	const SDValue *Parts,
				373	unsigned NumParts,
				374	MVT PartVT,
				375	MVT ValueVT,
				376	ISD::NodeType AssertOp = ISD::DELETED_NODE) {
				377	assert(NumParts > 0 && "No parts to assemble!");
				378	TargetLowering &TLI = DAG.getTargetLoweringInfo();
				379	SDValue Val = Parts[0];
				380
				381	if (NumParts > 1) {
				382	// Assemble the value from multiple parts.
				383	if (!ValueVT.isVector()) {
				384	unsigned PartBits = PartVT.getSizeInBits();
				385	unsigned ValueBits = ValueVT.getSizeInBits();
				386
				387	// Assemble the power of 2 part.
				388	unsigned RoundParts = NumParts & (NumParts - 1) ?
				389	1 << Log2_32(NumParts) : NumParts;
				390	unsigned RoundBits = PartBits * RoundParts;
				391	MVT RoundVT = RoundBits == ValueBits ?
				392	ValueVT : MVT::getIntegerVT(RoundBits);
				393	SDValue Lo, Hi;
				394
Duncan Sands	d22ec5f	2008-10-29 14:22:20 +0000	[diff] [blame]	395	MVT HalfVT = ValueVT.isInteger() ?
				396	MVT::getIntegerVT(RoundBits/2) :
				397	MVT::getFloatingPointVT(RoundBits/2);
				398
Dan Gohman	f0cbcd4	2008-09-03 16:12:24 +0000	[diff] [blame]	399	if (RoundParts > 2) {
Dan Gohman	f0cbcd4	2008-09-03 16:12:24 +0000	[diff] [blame]	400	Lo = getCopyFromParts(DAG, Parts, RoundParts/2, PartVT, HalfVT);
				401	Hi = getCopyFromParts(DAG, Parts+RoundParts/2, RoundParts/2,
				402	PartVT, HalfVT);
				403	} else {
Duncan Sands	d22ec5f	2008-10-29 14:22:20 +0000	[diff] [blame]	404	Lo = DAG.getNode(ISD::BIT_CONVERT, HalfVT, Parts[0]);
				405	Hi = DAG.getNode(ISD::BIT_CONVERT, HalfVT, Parts[1]);
Dan Gohman	f0cbcd4	2008-09-03 16:12:24 +0000	[diff] [blame]	406	}
				407	if (TLI.isBigEndian())
				408	std::swap(Lo, Hi);
				409	Val = DAG.getNode(ISD::BUILD_PAIR, RoundVT, Lo, Hi);
				410
				411	if (RoundParts < NumParts) {
				412	// Assemble the trailing non-power-of-2 part.
				413	unsigned OddParts = NumParts - RoundParts;
				414	MVT OddVT = MVT::getIntegerVT(OddParts * PartBits);
				415	Hi = getCopyFromParts(DAG, Parts+RoundParts, OddParts, PartVT, OddVT);
				416
				417	// Combine the round and odd parts.
				418	Lo = Val;
				419	if (TLI.isBigEndian())
				420	std::swap(Lo, Hi);
				421	MVT TotalVT = MVT::getIntegerVT(NumParts * PartBits);
				422	Hi = DAG.getNode(ISD::ANY_EXTEND, TotalVT, Hi);
				423	Hi = DAG.getNode(ISD::SHL, TotalVT, Hi,
				424	DAG.getConstant(Lo.getValueType().getSizeInBits(),
				425	TLI.getShiftAmountTy()));
				426	Lo = DAG.getNode(ISD::ZERO_EXTEND, TotalVT, Lo);
				427	Val = DAG.getNode(ISD::OR, TotalVT, Lo, Hi);
				428	}
				429	} else {
				430	// Handle a multi-element vector.
				431	MVT IntermediateVT, RegisterVT;
				432	unsigned NumIntermediates;
				433	unsigned NumRegs =
				434	TLI.getVectorTypeBreakdown(ValueVT, IntermediateVT, NumIntermediates,
				435	RegisterVT);
				436	assert(NumRegs == NumParts && "Part count doesn't match vector breakdown!");
				437	NumParts = NumRegs; // Silence a compiler warning.
				438	assert(RegisterVT == PartVT && "Part type doesn't match vector breakdown!");
				439	assert(RegisterVT == Parts[0].getValueType() &&
				440	"Part type doesn't match part!");
				441
				442	// Assemble the parts into intermediate operands.
				443	SmallVector<SDValue, 8> Ops(NumIntermediates);
				444	if (NumIntermediates == NumParts) {
				445	// If the register was not expanded, truncate or copy the value,
				446	// as appropriate.
				447	for (unsigned i = 0; i != NumParts; ++i)
				448	Ops[i] = getCopyFromParts(DAG, &Parts[i], 1,
				449	PartVT, IntermediateVT);
				450	} else if (NumParts > 0) {
				451	// If the intermediate type was expanded, build the intermediate operands
				452	// from the parts.
				453	assert(NumParts % NumIntermediates == 0 &&
				454	"Must expand into a divisible number of parts!");
				455	unsigned Factor = NumParts / NumIntermediates;
				456	for (unsigned i = 0; i != NumIntermediates; ++i)
				457	Ops[i] = getCopyFromParts(DAG, &Parts[i * Factor], Factor,
				458	PartVT, IntermediateVT);
				459	}
				460
				461	// Build a vector with BUILD_VECTOR or CONCAT_VECTORS from the intermediate
				462	// operands.
				463	Val = DAG.getNode(IntermediateVT.isVector() ?
				464	ISD::CONCAT_VECTORS : ISD::BUILD_VECTOR,
				465	ValueVT, &Ops[0], NumIntermediates);
				466	}
				467	}
				468
				469	// There is now one part, held in Val. Correct it to match ValueVT.
				470	PartVT = Val.getValueType();
				471
				472	if (PartVT == ValueVT)
				473	return Val;
				474
				475	if (PartVT.isVector()) {
				476	assert(ValueVT.isVector() && "Unknown vector conversion!");
				477	return DAG.getNode(ISD::BIT_CONVERT, ValueVT, Val);
				478	}
				479
				480	if (ValueVT.isVector()) {
				481	assert(ValueVT.getVectorElementType() == PartVT &&
				482	ValueVT.getVectorNumElements() == 1 &&
				483	"Only trivial scalar-to-vector conversions should get here!");
				484	return DAG.getNode(ISD::BUILD_VECTOR, ValueVT, Val);
				485	}
				486
				487	if (PartVT.isInteger() &&
				488	ValueVT.isInteger()) {
				489	if (ValueVT.bitsLT(PartVT)) {
				490	// For a truncate, see if we have any information to
				491	// indicate whether the truncated bits will always be
				492	// zero or sign-extension.
				493	if (AssertOp != ISD::DELETED_NODE)
				494	Val = DAG.getNode(AssertOp, PartVT, Val,
				495	DAG.getValueType(ValueVT));
				496	return DAG.getNode(ISD::TRUNCATE, ValueVT, Val);
				497	} else {
				498	return DAG.getNode(ISD::ANY_EXTEND, ValueVT, Val);
				499	}
				500	}
				501
				502	if (PartVT.isFloatingPoint() && ValueVT.isFloatingPoint()) {
				503	if (ValueVT.bitsLT(Val.getValueType()))
				504	// FP_ROUND's are always exact here.
				505	return DAG.getNode(ISD::FP_ROUND, ValueVT, Val,
				506	DAG.getIntPtrConstant(1));
				507	return DAG.getNode(ISD::FP_EXTEND, ValueVT, Val);
				508	}
				509
				510	if (PartVT.getSizeInBits() == ValueVT.getSizeInBits())
				511	return DAG.getNode(ISD::BIT_CONVERT, ValueVT, Val);
				512
				513	assert(0 && "Unknown mismatch!");
				514	return SDValue();
				515	}
				516
				517	/// getCopyToParts - Create a series of nodes that contain the specified value
				518	/// split into legal parts. If the parts contain more bits than Val, then, for
				519	/// integers, ExtendKind can be used to specify how to generate the extra bits.
Chris Lattner	01426e1	2008-10-21 00:45:36 +0000	[diff] [blame]	520	static void getCopyToParts(SelectionDAG &DAG, SDValue Val,
				521	SDValue *Parts, unsigned NumParts, MVT PartVT,
Dan Gohman	f0cbcd4	2008-09-03 16:12:24 +0000	[diff] [blame]	522	ISD::NodeType ExtendKind = ISD::ANY_EXTEND) {
				523	TargetLowering &TLI = DAG.getTargetLoweringInfo();
				524	MVT PtrVT = TLI.getPointerTy();
				525	MVT ValueVT = Val.getValueType();
				526	unsigned PartBits = PartVT.getSizeInBits();
				527	assert(TLI.isTypeLegal(PartVT) && "Copying to an illegal type!");
				528
				529	if (!NumParts)
				530	return;
				531
				532	if (!ValueVT.isVector()) {
				533	if (PartVT == ValueVT) {
				534	assert(NumParts == 1 && "No-op copy with multiple parts!");
				535	Parts[0] = Val;
				536	return;
				537	}
				538
				539	if (NumParts * PartBits > ValueVT.getSizeInBits()) {
				540	// If the parts cover more bits than the value has, promote the value.
				541	if (PartVT.isFloatingPoint() && ValueVT.isFloatingPoint()) {
				542	assert(NumParts == 1 && "Do not know what to promote to!");
				543	Val = DAG.getNode(ISD::FP_EXTEND, PartVT, Val);
				544	} else if (PartVT.isInteger() && ValueVT.isInteger()) {
				545	ValueVT = MVT::getIntegerVT(NumParts * PartBits);
				546	Val = DAG.getNode(ExtendKind, ValueVT, Val);
				547	} else {
				548	assert(0 && "Unknown mismatch!");
				549	}
				550	} else if (PartBits == ValueVT.getSizeInBits()) {
				551	// Different types of the same size.
				552	assert(NumParts == 1 && PartVT != ValueVT);
				553	Val = DAG.getNode(ISD::BIT_CONVERT, PartVT, Val);
				554	} else if (NumParts * PartBits < ValueVT.getSizeInBits()) {
				555	// If the parts cover less bits than value has, truncate the value.
				556	if (PartVT.isInteger() && ValueVT.isInteger()) {
				557	ValueVT = MVT::getIntegerVT(NumParts * PartBits);
				558	Val = DAG.getNode(ISD::TRUNCATE, ValueVT, Val);
				559	} else {
				560	assert(0 && "Unknown mismatch!");
				561	}
				562	}
				563
				564	// The value may have changed - recompute ValueVT.
				565	ValueVT = Val.getValueType();
				566	assert(NumParts * PartBits == ValueVT.getSizeInBits() &&
				567	"Failed to tile the value with PartVT!");
				568
				569	if (NumParts == 1) {
				570	assert(PartVT == ValueVT && "Type conversion failed!");
				571	Parts[0] = Val;
				572	return;
				573	}
				574
				575	// Expand the value into multiple parts.
				576	if (NumParts & (NumParts - 1)) {
				577	// The number of parts is not a power of 2. Split off and copy the tail.
				578	assert(PartVT.isInteger() && ValueVT.isInteger() &&
				579	"Do not know what to expand to!");
				580	unsigned RoundParts = 1 << Log2_32(NumParts);
				581	unsigned RoundBits = RoundParts * PartBits;
				582	unsigned OddParts = NumParts - RoundParts;
				583	SDValue OddVal = DAG.getNode(ISD::SRL, ValueVT, Val,
				584	DAG.getConstant(RoundBits,
				585	TLI.getShiftAmountTy()));
				586	getCopyToParts(DAG, OddVal, Parts + RoundParts, OddParts, PartVT);
				587	if (TLI.isBigEndian())
				588	// The odd parts were reversed by getCopyToParts - unreverse them.
				589	std::reverse(Parts + RoundParts, Parts + NumParts);
				590	NumParts = RoundParts;
				591	ValueVT = MVT::getIntegerVT(NumParts * PartBits);
				592	Val = DAG.getNode(ISD::TRUNCATE, ValueVT, Val);
				593	}
				594
				595	// The number of parts is a power of 2. Repeatedly bisect the value using
				596	// EXTRACT_ELEMENT.
				597	Parts[0] = DAG.getNode(ISD::BIT_CONVERT,
				598	MVT::getIntegerVT(ValueVT.getSizeInBits()),
				599	Val);
				600	for (unsigned StepSize = NumParts; StepSize > 1; StepSize /= 2) {
				601	for (unsigned i = 0; i < NumParts; i += StepSize) {
				602	unsigned ThisBits = StepSize * PartBits / 2;
				603	MVT ThisVT = MVT::getIntegerVT (ThisBits);
				604	SDValue &Part0 = Parts[i];
				605	SDValue &Part1 = Parts[i+StepSize/2];
				606
				607	Part1 = DAG.getNode(ISD::EXTRACT_ELEMENT, ThisVT, Part0,
				608	DAG.getConstant(1, PtrVT));
				609	Part0 = DAG.getNode(ISD::EXTRACT_ELEMENT, ThisVT, Part0,
				610	DAG.getConstant(0, PtrVT));
				611
				612	if (ThisBits == PartBits && ThisVT != PartVT) {
				613	Part0 = DAG.getNode(ISD::BIT_CONVERT, PartVT, Part0);
				614	Part1 = DAG.getNode(ISD::BIT_CONVERT, PartVT, Part1);
				615	}
				616	}
				617	}
				618
				619	if (TLI.isBigEndian())
				620	std::reverse(Parts, Parts + NumParts);
				621
				622	return;
				623	}
				624
				625	// Vector ValueVT.
				626	if (NumParts == 1) {
				627	if (PartVT != ValueVT) {
				628	if (PartVT.isVector()) {
				629	Val = DAG.getNode(ISD::BIT_CONVERT, PartVT, Val);
				630	} else {
				631	assert(ValueVT.getVectorElementType() == PartVT &&
				632	ValueVT.getVectorNumElements() == 1 &&
				633	"Only trivial vector-to-scalar conversions should get here!");
				634	Val = DAG.getNode(ISD::EXTRACT_VECTOR_ELT, PartVT, Val,
				635	DAG.getConstant(0, PtrVT));
				636	}
				637	}
				638
				639	Parts[0] = Val;
				640	return;
				641	}
				642
				643	// Handle a multi-element vector.
				644	MVT IntermediateVT, RegisterVT;
				645	unsigned NumIntermediates;
				646	unsigned NumRegs =
				647	DAG.getTargetLoweringInfo()
				648	.getVectorTypeBreakdown(ValueVT, IntermediateVT, NumIntermediates,
				649	RegisterVT);
				650	unsigned NumElements = ValueVT.getVectorNumElements();
				651
				652	assert(NumRegs == NumParts && "Part count doesn't match vector breakdown!");
				653	NumParts = NumRegs; // Silence a compiler warning.
				654	assert(RegisterVT == PartVT && "Part type doesn't match vector breakdown!");
				655
				656	// Split the vector into intermediate operands.
				657	SmallVector<SDValue, 8> Ops(NumIntermediates);
				658	for (unsigned i = 0; i != NumIntermediates; ++i)
				659	if (IntermediateVT.isVector())
				660	Ops[i] = DAG.getNode(ISD::EXTRACT_SUBVECTOR,
				661	IntermediateVT, Val,
				662	DAG.getConstant(i * (NumElements / NumIntermediates),
				663	PtrVT));
				664	else
				665	Ops[i] = DAG.getNode(ISD::EXTRACT_VECTOR_ELT,
				666	IntermediateVT, Val,
				667	DAG.getConstant(i, PtrVT));
				668
				669	// Split the intermediate operands into legal parts.
				670	if (NumParts == NumIntermediates) {
				671	// If the register was not expanded, promote or copy the value,
				672	// as appropriate.
				673	for (unsigned i = 0; i != NumParts; ++i)
				674	getCopyToParts(DAG, Ops[i], &Parts[i], 1, PartVT);
				675	} else if (NumParts > 0) {
				676	// If the intermediate type was expanded, split each the value into
				677	// legal parts.
				678	assert(NumParts % NumIntermediates == 0 &&
				679	"Must expand into a divisible number of parts!");
				680	unsigned Factor = NumParts / NumIntermediates;
				681	for (unsigned i = 0; i != NumIntermediates; ++i)
				682	getCopyToParts(DAG, Ops[i], &Parts[i * Factor], Factor, PartVT);
				683	}
				684	}
				685
				686
				687	void SelectionDAGLowering::init(GCFunctionInfo *gfi, AliasAnalysis &aa) {
				688	AA = &aa;
				689	GFI = gfi;
				690	TD = DAG.getTarget().getTargetData();
				691	}
				692
				693	/// clear - Clear out the curret SelectionDAG and the associated
				694	/// state and prepare this SelectionDAGLowering object to be used
				695	/// for a new block. This doesn't clear out information about
				696	/// additional blocks that are needed to complete switch lowering
				697	/// or PHI node updating; that information is cleared out as it is
				698	/// consumed.
				699	void SelectionDAGLowering::clear() {
				700	NodeMap.clear();
				701	PendingLoads.clear();
				702	PendingExports.clear();
				703	DAG.clear();
				704	}
				705
				706	/// getRoot - Return the current virtual root of the Selection DAG,
				707	/// flushing any PendingLoad items. This must be done before emitting
				708	/// a store or any other node that may need to be ordered after any
				709	/// prior load instructions.
				710	///
				711	SDValue SelectionDAGLowering::getRoot() {
				712	if (PendingLoads.empty())
				713	return DAG.getRoot();
				714
				715	if (PendingLoads.size() == 1) {
				716	SDValue Root = PendingLoads[0];
				717	DAG.setRoot(Root);
				718	PendingLoads.clear();
				719	return Root;
				720	}
				721
				722	// Otherwise, we have to make a token factor node.
				723	SDValue Root = DAG.getNode(ISD::TokenFactor, MVT::Other,
				724	&PendingLoads[0], PendingLoads.size());
				725	PendingLoads.clear();
				726	DAG.setRoot(Root);
				727	return Root;
				728	}
				729
				730	/// getControlRoot - Similar to getRoot, but instead of flushing all the
				731	/// PendingLoad items, flush all the PendingExports items. It is necessary
				732	/// to do this before emitting a terminator instruction.
				733	///
				734	SDValue SelectionDAGLowering::getControlRoot() {
				735	SDValue Root = DAG.getRoot();
				736
				737	if (PendingExports.empty())
				738	return Root;
				739
				740	// Turn all of the CopyToReg chains into one factored node.
				741	if (Root.getOpcode() != ISD::EntryToken) {
				742	unsigned i = 0, e = PendingExports.size();
				743	for (; i != e; ++i) {
				744	assert(PendingExports[i].getNode()->getNumOperands() > 1);
				745	if (PendingExports[i].getNode()->getOperand(0) == Root)
				746	break; // Don't add the root if we already indirectly depend on it.
				747	}
				748
				749	if (i == e)
				750	PendingExports.push_back(Root);
				751	}
				752
				753	Root = DAG.getNode(ISD::TokenFactor, MVT::Other,
				754	&PendingExports[0],
				755	PendingExports.size());
				756	PendingExports.clear();
				757	DAG.setRoot(Root);
				758	return Root;
				759	}
				760
				761	void SelectionDAGLowering::visit(Instruction &I) {
				762	visit(I.getOpcode(), I);
				763	}
				764
				765	void SelectionDAGLowering::visit(unsigned Opcode, User &I) {
				766	// Note: this doesn't use InstVisitor, because it has to work with
				767	// ConstantExpr's in addition to instructions.
				768	switch (Opcode) {
				769	default: assert(0 && "Unknown instruction type encountered!");
				770	abort();
				771	// Build the switch statement using the Instruction.def file.
				772	#define HANDLE_INST(NUM, OPCODE, CLASS) \
				773	case Instruction::OPCODE:return visit##OPCODE((CLASS&)I);
				774	#include "llvm/Instruction.def"
				775	}
				776	}
				777
				778	void SelectionDAGLowering::visitAdd(User &I) {
				779	if (I.getType()->isFPOrFPVector())
				780	visitBinary(I, ISD::FADD);
				781	else
				782	visitBinary(I, ISD::ADD);
				783	}
				784
				785	void SelectionDAGLowering::visitMul(User &I) {
				786	if (I.getType()->isFPOrFPVector())
				787	visitBinary(I, ISD::FMUL);
				788	else
				789	visitBinary(I, ISD::MUL);
				790	}
				791
				792	SDValue SelectionDAGLowering::getValue(const Value *V) {
				793	SDValue &N = NodeMap[V];
				794	if (N.getNode()) return N;
				795
				796	if (Constant C = const_cast<Constant>(dyn_cast<Constant>(V))) {
				797	MVT VT = TLI.getValueType(V->getType(), true);
				798
				799	if (ConstantInt *CI = dyn_cast<ConstantInt>(C))
Dan Gohman	4fbd796	2008-09-12 18:08:03 +0000	[diff] [blame]	800	return N = DAG.getConstant(*CI, VT);
Dan Gohman	f0cbcd4	2008-09-03 16:12:24 +0000	[diff] [blame]	801
				802	if (GlobalValue *GV = dyn_cast<GlobalValue>(C))
				803	return N = DAG.getGlobalAddress(GV, VT);
				804
				805	if (isa<ConstantPointerNull>(C))
				806	return N = DAG.getConstant(0, TLI.getPointerTy());
				807
				808	if (ConstantFP *CFP = dyn_cast<ConstantFP>(C))
Dan Gohman	4fbd796	2008-09-12 18:08:03 +0000	[diff] [blame]	809	return N = DAG.getConstantFP(*CFP, VT);
Dan Gohman	f0cbcd4	2008-09-03 16:12:24 +0000	[diff] [blame]	810
				811	if (isa<UndefValue>(C) && !isa<VectorType>(V->getType()) &&
				812	!V->getType()->isAggregateType())
				813	return N = DAG.getNode(ISD::UNDEF, VT);
				814
				815	if (ConstantExpr *CE = dyn_cast<ConstantExpr>(C)) {
				816	visit(CE->getOpcode(), *CE);
				817	SDValue N1 = NodeMap[V];
				818	assert(N1.getNode() && "visit didn't populate the ValueMap!");
				819	return N1;
				820	}
				821
				822	if (isa<ConstantStruct>(C) \|\| isa<ConstantArray>(C)) {
				823	SmallVector<SDValue, 4> Constants;
				824	for (User::const_op_iterator OI = C->op_begin(), OE = C->op_end();
				825	OI != OE; ++OI) {
				826	SDNode Val = getValue(OI).getNode();
				827	for (unsigned i = 0, e = Val->getNumValues(); i != e; ++i)
				828	Constants.push_back(SDValue(Val, i));
				829	}
				830	return DAG.getMergeValues(&Constants[0], Constants.size());
				831	}
				832
				833	if (isa<StructType>(C->getType()) \|\| isa<ArrayType>(C->getType())) {
				834	assert((isa<ConstantAggregateZero>(C) \|\| isa<UndefValue>(C)) &&
				835	"Unknown struct or array constant!");
				836
				837	SmallVector<MVT, 4> ValueVTs;
				838	ComputeValueVTs(TLI, C->getType(), ValueVTs);
				839	unsigned NumElts = ValueVTs.size();
				840	if (NumElts == 0)
				841	return SDValue(); // empty struct
				842	SmallVector<SDValue, 4> Constants(NumElts);
				843	for (unsigned i = 0; i != NumElts; ++i) {
				844	MVT EltVT = ValueVTs[i];
				845	if (isa<UndefValue>(C))
				846	Constants[i] = DAG.getNode(ISD::UNDEF, EltVT);
				847	else if (EltVT.isFloatingPoint())
				848	Constants[i] = DAG.getConstantFP(0, EltVT);
				849	else
				850	Constants[i] = DAG.getConstant(0, EltVT);
				851	}
				852	return DAG.getMergeValues(&Constants[0], NumElts);
				853	}
				854
				855	const VectorType *VecTy = cast<VectorType>(V->getType());
				856	unsigned NumElements = VecTy->getNumElements();
				857
				858	// Now that we know the number and type of the elements, get that number of
				859	// elements into the Ops array based on what kind of constant it is.
				860	SmallVector<SDValue, 16> Ops;
				861	if (ConstantVector *CP = dyn_cast<ConstantVector>(C)) {
				862	for (unsigned i = 0; i != NumElements; ++i)
				863	Ops.push_back(getValue(CP->getOperand(i)));
				864	} else {
				865	assert((isa<ConstantAggregateZero>(C) \|\| isa<UndefValue>(C)) &&
				866	"Unknown vector constant!");
				867	MVT EltVT = TLI.getValueType(VecTy->getElementType());
				868
				869	SDValue Op;
				870	if (isa<UndefValue>(C))
				871	Op = DAG.getNode(ISD::UNDEF, EltVT);
				872	else if (EltVT.isFloatingPoint())
				873	Op = DAG.getConstantFP(0, EltVT);
				874	else
				875	Op = DAG.getConstant(0, EltVT);
				876	Ops.assign(NumElements, Op);
				877	}
				878
				879	// Create a BUILD_VECTOR node.
				880	return NodeMap[V] = DAG.getNode(ISD::BUILD_VECTOR, VT, &Ops[0], Ops.size());
				881	}
				882
				883	// If this is a static alloca, generate it as the frameindex instead of
				884	// computation.
				885	if (const AllocaInst *AI = dyn_cast<AllocaInst>(V)) {
				886	DenseMap<const AllocaInst*, int>::iterator SI =
				887	FuncInfo.StaticAllocaMap.find(AI);
				888	if (SI != FuncInfo.StaticAllocaMap.end())
				889	return DAG.getFrameIndex(SI->second, TLI.getPointerTy());
				890	}
				891
				892	unsigned InReg = FuncInfo.ValueMap[V];
				893	assert(InReg && "Value not in map!");
				894
				895	RegsForValue RFV(TLI, InReg, V->getType());
				896	SDValue Chain = DAG.getEntryNode();
				897	return RFV.getCopyFromRegs(DAG, Chain, NULL);
				898	}
				899
				900
				901	void SelectionDAGLowering::visitRet(ReturnInst &I) {
				902	if (I.getNumOperands() == 0) {
				903	DAG.setRoot(DAG.getNode(ISD::RET, MVT::Other, getControlRoot()));
				904	return;
				905	}
				906
				907	SmallVector<SDValue, 8> NewValues;
				908	NewValues.push_back(getControlRoot());
				909	for (unsigned i = 0, e = I.getNumOperands(); i != e; ++i) {
Dan Gohman	f0cbcd4	2008-09-03 16:12:24 +0000	[diff] [blame]	910	SmallVector<MVT, 4> ValueVTs;
				911	ComputeValueVTs(TLI, I.getOperand(i)->getType(), ValueVTs);
Dan Gohman	7ea1ca6	2008-10-21 20:00:42 +0000	[diff] [blame]	912	unsigned NumValues = ValueVTs.size();
				913	if (NumValues == 0) continue;
				914
				915	SDValue RetOp = getValue(I.getOperand(i));
				916	for (unsigned j = 0, f = NumValues; j != f; ++j) {
Dan Gohman	f0cbcd4	2008-09-03 16:12:24 +0000	[diff] [blame]	917	MVT VT = ValueVTs[j];
				918
				919	// FIXME: C calling convention requires the return type to be promoted to
Dale Johannesen	c9c6da6	2008-09-25 20:47:45 +0000	[diff] [blame]	920	// at least 32-bit. But this is not necessary for non-C calling
				921	// conventions.
Dan Gohman	f0cbcd4	2008-09-03 16:12:24 +0000	[diff] [blame]	922	if (VT.isInteger()) {
				923	MVT MinVT = TLI.getRegisterType(MVT::i32);
				924	if (VT.bitsLT(MinVT))
				925	VT = MinVT;
				926	}
				927
				928	unsigned NumParts = TLI.getNumRegisters(VT);
				929	MVT PartVT = TLI.getRegisterType(VT);
				930	SmallVector<SDValue, 4> Parts(NumParts);
				931	ISD::NodeType ExtendKind = ISD::ANY_EXTEND;
				932
				933	const Function *F = I.getParent()->getParent();
Devang Patel	0598866	2008-09-25 21:00:45 +0000	[diff] [blame]	934	if (F->paramHasAttr(0, Attribute::SExt))
Dan Gohman	f0cbcd4	2008-09-03 16:12:24 +0000	[diff] [blame]	935	ExtendKind = ISD::SIGN_EXTEND;
Devang Patel	0598866	2008-09-25 21:00:45 +0000	[diff] [blame]	936	else if (F->paramHasAttr(0, Attribute::ZExt))
Dan Gohman	f0cbcd4	2008-09-03 16:12:24 +0000	[diff] [blame]	937	ExtendKind = ISD::ZERO_EXTEND;
				938
				939	getCopyToParts(DAG, SDValue(RetOp.getNode(), RetOp.getResNo() + j),
				940	&Parts[0], NumParts, PartVT, ExtendKind);
				941
Dale Johannesen	c9c6da6	2008-09-25 20:47:45 +0000	[diff] [blame]	942	// 'inreg' on function refers to return value
				943	ISD::ArgFlagsTy Flags = ISD::ArgFlagsTy();
Devang Patel	0598866	2008-09-25 21:00:45 +0000	[diff] [blame]	944	if (F->paramHasAttr(0, Attribute::InReg))
Dale Johannesen	c9c6da6	2008-09-25 20:47:45 +0000	[diff] [blame]	945	Flags.setInReg();
Dan Gohman	f0cbcd4	2008-09-03 16:12:24 +0000	[diff] [blame]	946	for (unsigned i = 0; i < NumParts; ++i) {
				947	NewValues.push_back(Parts[i]);
Dale Johannesen	c9c6da6	2008-09-25 20:47:45 +0000	[diff] [blame]	948	NewValues.push_back(DAG.getArgFlags(Flags));
Dan Gohman	f0cbcd4	2008-09-03 16:12:24 +0000	[diff] [blame]	949	}
				950	}
				951	}
				952	DAG.setRoot(DAG.getNode(ISD::RET, MVT::Other,
				953	&NewValues[0], NewValues.size()));
				954	}
				955
				956	/// ExportFromCurrentBlock - If this condition isn't known to be exported from
				957	/// the current basic block, add it to ValueMap now so that we'll get a
				958	/// CopyTo/FromReg.
				959	void SelectionDAGLowering::ExportFromCurrentBlock(Value *V) {
				960	// No need to export constants.
				961	if (!isa<Instruction>(V) && !isa<Argument>(V)) return;
				962
				963	// Already exported?
				964	if (FuncInfo.isExportedInst(V)) return;
				965
				966	unsigned Reg = FuncInfo.InitializeRegForValue(V);
				967	CopyValueToVirtualRegister(V, Reg);
				968	}
				969
				970	bool SelectionDAGLowering::isExportableFromCurrentBlock(Value *V,
				971	const BasicBlock *FromBB) {
				972	// The operands of the setcc have to be in this block. We don't know
				973	// how to export them from some other block.
				974	if (Instruction *VI = dyn_cast<Instruction>(V)) {
				975	// Can export from current BB.
				976	if (VI->getParent() == FromBB)
				977	return true;
				978
				979	// Is already exported, noop.
				980	return FuncInfo.isExportedInst(V);
				981	}
				982
				983	// If this is an argument, we can export it if the BB is the entry block or
				984	// if it is already exported.
				985	if (isa<Argument>(V)) {
				986	if (FromBB == &FromBB->getParent()->getEntryBlock())
				987	return true;
				988
				989	// Otherwise, can only export this if it is already exported.
				990	return FuncInfo.isExportedInst(V);
				991	}
				992
				993	// Otherwise, constants can always be exported.
				994	return true;
				995	}
				996
				997	static bool InBlock(const Value V, const BasicBlock BB) {
				998	if (const Instruction *I = dyn_cast<Instruction>(V))
				999	return I->getParent() == BB;
				1000	return true;
				1001	}
				1002
Dan Gohman	8c1a6ca	2008-10-17 18:18:45 +0000	[diff] [blame]	1003	/// getFCmpCondCode - Return the ISD condition code corresponding to
				1004	/// the given LLVM IR floating-point condition code. This includes
				1005	/// consideration of global floating-point math flags.
				1006	///
				1007	static ISD::CondCode getFCmpCondCode(FCmpInst::Predicate Pred) {
				1008	ISD::CondCode FPC, FOC;
				1009	switch (Pred) {
				1010	case FCmpInst::FCMP_FALSE: FOC = FPC = ISD::SETFALSE; break;
				1011	case FCmpInst::FCMP_OEQ: FOC = ISD::SETEQ; FPC = ISD::SETOEQ; break;
				1012	case FCmpInst::FCMP_OGT: FOC = ISD::SETGT; FPC = ISD::SETOGT; break;
				1013	case FCmpInst::FCMP_OGE: FOC = ISD::SETGE; FPC = ISD::SETOGE; break;
				1014	case FCmpInst::FCMP_OLT: FOC = ISD::SETLT; FPC = ISD::SETOLT; break;
				1015	case FCmpInst::FCMP_OLE: FOC = ISD::SETLE; FPC = ISD::SETOLE; break;
				1016	case FCmpInst::FCMP_ONE: FOC = ISD::SETNE; FPC = ISD::SETONE; break;
				1017	case FCmpInst::FCMP_ORD: FOC = FPC = ISD::SETO; break;
				1018	case FCmpInst::FCMP_UNO: FOC = FPC = ISD::SETUO; break;
				1019	case FCmpInst::FCMP_UEQ: FOC = ISD::SETEQ; FPC = ISD::SETUEQ; break;
				1020	case FCmpInst::FCMP_UGT: FOC = ISD::SETGT; FPC = ISD::SETUGT; break;
				1021	case FCmpInst::FCMP_UGE: FOC = ISD::SETGE; FPC = ISD::SETUGE; break;
				1022	case FCmpInst::FCMP_ULT: FOC = ISD::SETLT; FPC = ISD::SETULT; break;
				1023	case FCmpInst::FCMP_ULE: FOC = ISD::SETLE; FPC = ISD::SETULE; break;
				1024	case FCmpInst::FCMP_UNE: FOC = ISD::SETNE; FPC = ISD::SETUNE; break;
				1025	case FCmpInst::FCMP_TRUE: FOC = FPC = ISD::SETTRUE; break;
				1026	default:
				1027	assert(0 && "Invalid FCmp predicate opcode!");
				1028	FOC = FPC = ISD::SETFALSE;
				1029	break;
				1030	}
				1031	if (FiniteOnlyFPMath())
				1032	return FOC;
				1033	else
				1034	return FPC;
				1035	}
				1036
				1037	/// getICmpCondCode - Return the ISD condition code corresponding to
				1038	/// the given LLVM IR integer condition code.
				1039	///
				1040	static ISD::CondCode getICmpCondCode(ICmpInst::Predicate Pred) {
				1041	switch (Pred) {
				1042	case ICmpInst::ICMP_EQ: return ISD::SETEQ;
				1043	case ICmpInst::ICMP_NE: return ISD::SETNE;
				1044	case ICmpInst::ICMP_SLE: return ISD::SETLE;
				1045	case ICmpInst::ICMP_ULE: return ISD::SETULE;
				1046	case ICmpInst::ICMP_SGE: return ISD::SETGE;
				1047	case ICmpInst::ICMP_UGE: return ISD::SETUGE;
				1048	case ICmpInst::ICMP_SLT: return ISD::SETLT;
				1049	case ICmpInst::ICMP_ULT: return ISD::SETULT;
				1050	case ICmpInst::ICMP_SGT: return ISD::SETGT;
				1051	case ICmpInst::ICMP_UGT: return ISD::SETUGT;
				1052	default:
				1053	assert(0 && "Invalid ICmp predicate opcode!");
				1054	return ISD::SETNE;
				1055	}
				1056	}
				1057
Dan Gohman	c227734	2008-10-17 21:16:08 +0000	[diff] [blame]	1058	/// EmitBranchForMergedCondition - Helper method for FindMergedConditions.
				1059	/// This function emits a branch and is used at the leaves of an OR or an
				1060	/// AND operator tree.
				1061	///
				1062	void
				1063	SelectionDAGLowering::EmitBranchForMergedCondition(Value *Cond,
				1064	MachineBasicBlock *TBB,
				1065	MachineBasicBlock *FBB,
				1066	MachineBasicBlock *CurBB) {
				1067	const BasicBlock *BB = CurBB->getBasicBlock();
Dan Gohman	f0cbcd4	2008-09-03 16:12:24 +0000	[diff] [blame]	1068
Dan Gohman	c227734	2008-10-17 21:16:08 +0000	[diff] [blame]	1069	// If the leaf of the tree is a comparison, merge the condition into
				1070	// the caseblock.
				1071	if (CmpInst *BOp = dyn_cast<CmpInst>(Cond)) {
				1072	// The operands of the cmp have to be in this block. We don't know
				1073	// how to export them from some other block. If this is the first block
				1074	// of the sequence, no exporting is needed.
				1075	if (CurBB == CurMBB \|\|
				1076	(isExportableFromCurrentBlock(BOp->getOperand(0), BB) &&
				1077	isExportableFromCurrentBlock(BOp->getOperand(1), BB))) {
Dan Gohman	f0cbcd4	2008-09-03 16:12:24 +0000	[diff] [blame]	1078	ISD::CondCode Condition;
				1079	if (ICmpInst *IC = dyn_cast<ICmpInst>(Cond)) {
Dan Gohman	8c1a6ca	2008-10-17 18:18:45 +0000	[diff] [blame]	1080	Condition = getICmpCondCode(IC->getPredicate());
Dan Gohman	f0cbcd4	2008-09-03 16:12:24 +0000	[diff] [blame]	1081	} else if (FCmpInst *FC = dyn_cast<FCmpInst>(Cond)) {
Dan Gohman	8c1a6ca	2008-10-17 18:18:45 +0000	[diff] [blame]	1082	Condition = getFCmpCondCode(FC->getPredicate());
Dan Gohman	f0cbcd4	2008-09-03 16:12:24 +0000	[diff] [blame]	1083	} else {
				1084	Condition = ISD::SETEQ; // silence warning.
				1085	assert(0 && "Unknown compare instruction");
				1086	}
Dan Gohman	c227734	2008-10-17 21:16:08 +0000	[diff] [blame]	1087
				1088	CaseBlock CB(Condition, BOp->getOperand(0),
Dan Gohman	f0cbcd4	2008-09-03 16:12:24 +0000	[diff] [blame]	1089	BOp->getOperand(1), NULL, TBB, FBB, CurBB);
				1090	SwitchCases.push_back(CB);
				1091	return;
				1092	}
Dan Gohman	c227734	2008-10-17 21:16:08 +0000	[diff] [blame]	1093	}
				1094
				1095	// Create a CaseBlock record representing this branch.
				1096	CaseBlock CB(ISD::SETEQ, Cond, ConstantInt::getTrue(),
				1097	NULL, TBB, FBB, CurBB);
				1098	SwitchCases.push_back(CB);
				1099	}
				1100
				1101	/// FindMergedConditions - If Cond is an expression like
				1102	void SelectionDAGLowering::FindMergedConditions(Value *Cond,
				1103	MachineBasicBlock *TBB,
				1104	MachineBasicBlock *FBB,
				1105	MachineBasicBlock *CurBB,
				1106	unsigned Opc) {
				1107	// If this node is not part of the or/and tree, emit it as a branch.
				1108	Instruction *BOp = dyn_cast<Instruction>(Cond);
				1109	if (!BOp \|\| !(isa<BinaryOperator>(BOp) \|\| isa<CmpInst>(BOp)) \|\|
				1110	(unsigned)BOp->getOpcode() != Opc \|\| !BOp->hasOneUse() \|\|
				1111	BOp->getParent() != CurBB->getBasicBlock() \|\|
				1112	!InBlock(BOp->getOperand(0), CurBB->getBasicBlock()) \|\|
				1113	!InBlock(BOp->getOperand(1), CurBB->getBasicBlock())) {
				1114	EmitBranchForMergedCondition(Cond, TBB, FBB, CurBB);
Dan Gohman	f0cbcd4	2008-09-03 16:12:24 +0000	[diff] [blame]	1115	return;
				1116	}
				1117
Dan Gohman	f0cbcd4	2008-09-03 16:12:24 +0000	[diff] [blame]	1118	// Create TmpBB after CurBB.
				1119	MachineFunction::iterator BBI = CurBB;
				1120	MachineFunction &MF = DAG.getMachineFunction();
				1121	MachineBasicBlock *TmpBB = MF.CreateMachineBasicBlock(CurBB->getBasicBlock());
				1122	CurBB->getParent()->insert(++BBI, TmpBB);
				1123
				1124	if (Opc == Instruction::Or) {
				1125	// Codegen X \| Y as:
				1126	// jmp_if_X TBB
				1127	// jmp TmpBB
				1128	// TmpBB:
				1129	// jmp_if_Y TBB
				1130	// jmp FBB
				1131	//
				1132
				1133	// Emit the LHS condition.
				1134	FindMergedConditions(BOp->getOperand(0), TBB, TmpBB, CurBB, Opc);
				1135
				1136	// Emit the RHS condition into TmpBB.
				1137	FindMergedConditions(BOp->getOperand(1), TBB, FBB, TmpBB, Opc);
				1138	} else {
				1139	assert(Opc == Instruction::And && "Unknown merge op!");
				1140	// Codegen X & Y as:
				1141	// jmp_if_X TmpBB
				1142	// jmp FBB
				1143	// TmpBB:
				1144	// jmp_if_Y TBB
				1145	// jmp FBB
				1146	//
				1147	// This requires creation of TmpBB after CurBB.
				1148
				1149	// Emit the LHS condition.
				1150	FindMergedConditions(BOp->getOperand(0), TmpBB, FBB, CurBB, Opc);
				1151
				1152	// Emit the RHS condition into TmpBB.
				1153	FindMergedConditions(BOp->getOperand(1), TBB, FBB, TmpBB, Opc);
				1154	}
				1155	}
				1156
				1157	/// If the set of cases should be emitted as a series of branches, return true.
				1158	/// If we should emit this as a bunch of and/or'd together conditions, return
				1159	/// false.
				1160	bool
				1161	SelectionDAGLowering::ShouldEmitAsBranches(const std::vector<CaseBlock> &Cases){
				1162	if (Cases.size() != 2) return true;
				1163
				1164	// If this is two comparisons of the same values or'd or and'd together, they
				1165	// will get folded into a single comparison, so don't emit two blocks.
				1166	if ((Cases[0].CmpLHS == Cases[1].CmpLHS &&
				1167	Cases[0].CmpRHS == Cases[1].CmpRHS) \|\|
				1168	(Cases[0].CmpRHS == Cases[1].CmpLHS &&
				1169	Cases[0].CmpLHS == Cases[1].CmpRHS)) {
				1170	return false;
				1171	}
				1172
				1173	return true;
				1174	}
				1175
				1176	void SelectionDAGLowering::visitBr(BranchInst &I) {
				1177	// Update machine-CFG edges.
				1178	MachineBasicBlock *Succ0MBB = FuncInfo.MBBMap[I.getSuccessor(0)];
				1179
				1180	// Figure out which block is immediately after the current one.
				1181	MachineBasicBlock *NextBlock = 0;
				1182	MachineFunction::iterator BBI = CurMBB;
				1183	if (++BBI != CurMBB->getParent()->end())
				1184	NextBlock = BBI;
				1185
				1186	if (I.isUnconditional()) {
				1187	// Update machine-CFG edges.
				1188	CurMBB->addSuccessor(Succ0MBB);
				1189
				1190	// If this is not a fall-through branch, emit the branch.
				1191	if (Succ0MBB != NextBlock)
				1192	DAG.setRoot(DAG.getNode(ISD::BR, MVT::Other, getControlRoot(),
				1193	DAG.getBasicBlock(Succ0MBB)));
				1194	return;
				1195	}
				1196
				1197	// If this condition is one of the special cases we handle, do special stuff
				1198	// now.
				1199	Value *CondVal = I.getCondition();
				1200	MachineBasicBlock *Succ1MBB = FuncInfo.MBBMap[I.getSuccessor(1)];
				1201
				1202	// If this is a series of conditions that are or'd or and'd together, emit
				1203	// this as a sequence of branches instead of setcc's with and/or operations.
				1204	// For example, instead of something like:
				1205	// cmp A, B
				1206	// C = seteq
				1207	// cmp D, E
				1208	// F = setle
				1209	// or C, F
				1210	// jnz foo
				1211	// Emit:
				1212	// cmp A, B
				1213	// je foo
				1214	// cmp D, E
				1215	// jle foo
				1216	//
				1217	if (BinaryOperator *BOp = dyn_cast<BinaryOperator>(CondVal)) {
				1218	if (BOp->hasOneUse() &&
				1219	(BOp->getOpcode() == Instruction::And \|\|
				1220	BOp->getOpcode() == Instruction::Or)) {
				1221	FindMergedConditions(BOp, Succ0MBB, Succ1MBB, CurMBB, BOp->getOpcode());
				1222	// If the compares in later blocks need to use values not currently
				1223	// exported from this block, export them now. This block should always
				1224	// be the first entry.
				1225	assert(SwitchCases[0].ThisBB == CurMBB && "Unexpected lowering!");
				1226
				1227	// Allow some cases to be rejected.
				1228	if (ShouldEmitAsBranches(SwitchCases)) {
				1229	for (unsigned i = 1, e = SwitchCases.size(); i != e; ++i) {
				1230	ExportFromCurrentBlock(SwitchCases[i].CmpLHS);
				1231	ExportFromCurrentBlock(SwitchCases[i].CmpRHS);
				1232	}
				1233
				1234	// Emit the branch for this block.
				1235	visitSwitchCase(SwitchCases[0]);
				1236	SwitchCases.erase(SwitchCases.begin());
				1237	return;
				1238	}
				1239
				1240	// Okay, we decided not to do this, remove any inserted MBB's and clear
				1241	// SwitchCases.
				1242	for (unsigned i = 1, e = SwitchCases.size(); i != e; ++i)
				1243	CurMBB->getParent()->erase(SwitchCases[i].ThisBB);
				1244
				1245	SwitchCases.clear();
				1246	}
				1247	}
				1248
				1249	// Create a CaseBlock record representing this branch.
				1250	CaseBlock CB(ISD::SETEQ, CondVal, ConstantInt::getTrue(),
				1251	NULL, Succ0MBB, Succ1MBB, CurMBB);
				1252	// Use visitSwitchCase to actually insert the fast branch sequence for this
				1253	// cond branch.
				1254	visitSwitchCase(CB);
				1255	}
				1256
				1257	/// visitSwitchCase - Emits the necessary code to represent a single node in
				1258	/// the binary search tree resulting from lowering a switch instruction.
				1259	void SelectionDAGLowering::visitSwitchCase(CaseBlock &CB) {
				1260	SDValue Cond;
				1261	SDValue CondLHS = getValue(CB.CmpLHS);
				1262
				1263	// Build the setcc now.
				1264	if (CB.CmpMHS == NULL) {
				1265	// Fold "(X == true)" to X and "(X == false)" to !X to
				1266	// handle common cases produced by branch lowering.
				1267	if (CB.CmpRHS == ConstantInt::getTrue() && CB.CC == ISD::SETEQ)
				1268	Cond = CondLHS;
				1269	else if (CB.CmpRHS == ConstantInt::getFalse() && CB.CC == ISD::SETEQ) {
				1270	SDValue True = DAG.getConstant(1, CondLHS.getValueType());
				1271	Cond = DAG.getNode(ISD::XOR, CondLHS.getValueType(), CondLHS, True);
				1272	} else
				1273	Cond = DAG.getSetCC(MVT::i1, CondLHS, getValue(CB.CmpRHS), CB.CC);
				1274	} else {
				1275	assert(CB.CC == ISD::SETLE && "Can handle only LE ranges now");
				1276
				1277	uint64_t Low = cast<ConstantInt>(CB.CmpLHS)->getSExtValue();
				1278	uint64_t High = cast<ConstantInt>(CB.CmpRHS)->getSExtValue();
				1279
				1280	SDValue CmpOp = getValue(CB.CmpMHS);
				1281	MVT VT = CmpOp.getValueType();
				1282
				1283	if (cast<ConstantInt>(CB.CmpLHS)->isMinValue(true)) {
				1284	Cond = DAG.getSetCC(MVT::i1, CmpOp, DAG.getConstant(High, VT), ISD::SETLE);
				1285	} else {
				1286	SDValue SUB = DAG.getNode(ISD::SUB, VT, CmpOp, DAG.getConstant(Low, VT));
				1287	Cond = DAG.getSetCC(MVT::i1, SUB,
				1288	DAG.getConstant(High-Low, VT), ISD::SETULE);
				1289	}
				1290	}
				1291
				1292	// Update successor info
				1293	CurMBB->addSuccessor(CB.TrueBB);
				1294	CurMBB->addSuccessor(CB.FalseBB);
				1295
				1296	// Set NextBlock to be the MBB immediately after the current one, if any.
				1297	// This is used to avoid emitting unnecessary branches to the next block.
				1298	MachineBasicBlock *NextBlock = 0;
				1299	MachineFunction::iterator BBI = CurMBB;
				1300	if (++BBI != CurMBB->getParent()->end())
				1301	NextBlock = BBI;
				1302
				1303	// If the lhs block is the next block, invert the condition so that we can
				1304	// fall through to the lhs instead of the rhs block.
				1305	if (CB.TrueBB == NextBlock) {
				1306	std::swap(CB.TrueBB, CB.FalseBB);
				1307	SDValue True = DAG.getConstant(1, Cond.getValueType());
				1308	Cond = DAG.getNode(ISD::XOR, Cond.getValueType(), Cond, True);
				1309	}
				1310	SDValue BrCond = DAG.getNode(ISD::BRCOND, MVT::Other, getControlRoot(), Cond,
				1311	DAG.getBasicBlock(CB.TrueBB));
				1312
				1313	// If the branch was constant folded, fix up the CFG.
				1314	if (BrCond.getOpcode() == ISD::BR) {
				1315	CurMBB->removeSuccessor(CB.FalseBB);
				1316	DAG.setRoot(BrCond);
				1317	} else {
				1318	// Otherwise, go ahead and insert the false branch.
				1319	if (BrCond == getControlRoot())
				1320	CurMBB->removeSuccessor(CB.TrueBB);
				1321
				1322	if (CB.FalseBB == NextBlock)
				1323	DAG.setRoot(BrCond);
				1324	else
				1325	DAG.setRoot(DAG.getNode(ISD::BR, MVT::Other, BrCond,
				1326	DAG.getBasicBlock(CB.FalseBB)));
				1327	}
				1328	}
				1329
				1330	/// visitJumpTable - Emit JumpTable node in the current MBB
				1331	void SelectionDAGLowering::visitJumpTable(JumpTable &JT) {
				1332	// Emit the code for the jump table
				1333	assert(JT.Reg != -1U && "Should lower JT Header first!");
				1334	MVT PTy = TLI.getPointerTy();
				1335	SDValue Index = DAG.getCopyFromReg(getControlRoot(), JT.Reg, PTy);
				1336	SDValue Table = DAG.getJumpTable(JT.JTI, PTy);
				1337	DAG.setRoot(DAG.getNode(ISD::BR_JT, MVT::Other, Index.getValue(1),
				1338	Table, Index));
				1339	return;
				1340	}
				1341
				1342	/// visitJumpTableHeader - This function emits necessary code to produce index
				1343	/// in the JumpTable from switch case.
				1344	void SelectionDAGLowering::visitJumpTableHeader(JumpTable &JT,
				1345	JumpTableHeader &JTH) {
				1346	// Subtract the lowest switch case value from the value being switched on
				1347	// and conditional branch to default mbb if the result is greater than the
				1348	// difference between smallest and largest cases.
				1349	SDValue SwitchOp = getValue(JTH.SValue);
				1350	MVT VT = SwitchOp.getValueType();
				1351	SDValue SUB = DAG.getNode(ISD::SUB, VT, SwitchOp,
				1352	DAG.getConstant(JTH.First, VT));
				1353
				1354	// The SDNode we just created, which holds the value being switched on
				1355	// minus the the smallest case value, needs to be copied to a virtual
				1356	// register so it can be used as an index into the jump table in a
				1357	// subsequent basic block. This value may be smaller or larger than the
				1358	// target's pointer type, and therefore require extension or truncating.
				1359	if (VT.bitsGT(TLI.getPointerTy()))
				1360	SwitchOp = DAG.getNode(ISD::TRUNCATE, TLI.getPointerTy(), SUB);
				1361	else
				1362	SwitchOp = DAG.getNode(ISD::ZERO_EXTEND, TLI.getPointerTy(), SUB);
				1363
				1364	unsigned JumpTableReg = FuncInfo.MakeReg(TLI.getPointerTy());
				1365	SDValue CopyTo = DAG.getCopyToReg(getControlRoot(), JumpTableReg, SwitchOp);
				1366	JT.Reg = JumpTableReg;
				1367
				1368	// Emit the range check for the jump table, and branch to the default
				1369	// block for the switch statement if the value being switched on exceeds
				1370	// the largest case in the switch.
				1371	SDValue CMP = DAG.getSetCC(TLI.getSetCCResultType(SUB), SUB,
				1372	DAG.getConstant(JTH.Last-JTH.First,VT),
				1373	ISD::SETUGT);
				1374
				1375	// Set NextBlock to be the MBB immediately after the current one, if any.
				1376	// This is used to avoid emitting unnecessary branches to the next block.
				1377	MachineBasicBlock *NextBlock = 0;
				1378	MachineFunction::iterator BBI = CurMBB;
				1379	if (++BBI != CurMBB->getParent()->end())
				1380	NextBlock = BBI;
				1381
				1382	SDValue BrCond = DAG.getNode(ISD::BRCOND, MVT::Other, CopyTo, CMP,
				1383	DAG.getBasicBlock(JT.Default));
				1384
				1385	if (JT.MBB == NextBlock)
				1386	DAG.setRoot(BrCond);
				1387	else
				1388	DAG.setRoot(DAG.getNode(ISD::BR, MVT::Other, BrCond,
				1389	DAG.getBasicBlock(JT.MBB)));
				1390
				1391	return;
				1392	}
				1393
				1394	/// visitBitTestHeader - This function emits necessary code to produce value
				1395	/// suitable for "bit tests"
				1396	void SelectionDAGLowering::visitBitTestHeader(BitTestBlock &B) {
				1397	// Subtract the minimum value
				1398	SDValue SwitchOp = getValue(B.SValue);
				1399	MVT VT = SwitchOp.getValueType();
				1400	SDValue SUB = DAG.getNode(ISD::SUB, VT, SwitchOp,
				1401	DAG.getConstant(B.First, VT));
				1402
				1403	// Check range
				1404	SDValue RangeCmp = DAG.getSetCC(TLI.getSetCCResultType(SUB), SUB,
				1405	DAG.getConstant(B.Range, VT),
				1406	ISD::SETUGT);
				1407
				1408	SDValue ShiftOp;
				1409	if (VT.bitsGT(TLI.getShiftAmountTy()))
				1410	ShiftOp = DAG.getNode(ISD::TRUNCATE, TLI.getShiftAmountTy(), SUB);
				1411	else
				1412	ShiftOp = DAG.getNode(ISD::ZERO_EXTEND, TLI.getShiftAmountTy(), SUB);
				1413
				1414	// Make desired shift
				1415	SDValue SwitchVal = DAG.getNode(ISD::SHL, TLI.getPointerTy(),
				1416	DAG.getConstant(1, TLI.getPointerTy()),
				1417	ShiftOp);
				1418
				1419	unsigned SwitchReg = FuncInfo.MakeReg(TLI.getPointerTy());
				1420	SDValue CopyTo = DAG.getCopyToReg(getControlRoot(), SwitchReg, SwitchVal);
				1421	B.Reg = SwitchReg;
				1422
				1423	// Set NextBlock to be the MBB immediately after the current one, if any.
				1424	// This is used to avoid emitting unnecessary branches to the next block.
				1425	MachineBasicBlock *NextBlock = 0;
				1426	MachineFunction::iterator BBI = CurMBB;
				1427	if (++BBI != CurMBB->getParent()->end())
				1428	NextBlock = BBI;
				1429
				1430	MachineBasicBlock* MBB = B.Cases[0].ThisBB;
				1431
				1432	CurMBB->addSuccessor(B.Default);
				1433	CurMBB->addSuccessor(MBB);
				1434
				1435	SDValue BrRange = DAG.getNode(ISD::BRCOND, MVT::Other, CopyTo, RangeCmp,
				1436	DAG.getBasicBlock(B.Default));
				1437
				1438	if (MBB == NextBlock)
				1439	DAG.setRoot(BrRange);
				1440	else
				1441	DAG.setRoot(DAG.getNode(ISD::BR, MVT::Other, CopyTo,
				1442	DAG.getBasicBlock(MBB)));
				1443
				1444	return;
				1445	}
				1446
				1447	/// visitBitTestCase - this function produces one "bit test"
				1448	void SelectionDAGLowering::visitBitTestCase(MachineBasicBlock* NextMBB,
				1449	unsigned Reg,
				1450	BitTestCase &B) {
				1451	// Emit bit tests and jumps
				1452	SDValue SwitchVal = DAG.getCopyFromReg(getControlRoot(), Reg,
				1453	TLI.getPointerTy());
				1454
				1455	SDValue AndOp = DAG.getNode(ISD::AND, TLI.getPointerTy(), SwitchVal,
				1456	DAG.getConstant(B.Mask, TLI.getPointerTy()));
				1457	SDValue AndCmp = DAG.getSetCC(TLI.getSetCCResultType(AndOp), AndOp,
				1458	DAG.getConstant(0, TLI.getPointerTy()),
				1459	ISD::SETNE);
				1460
				1461	CurMBB->addSuccessor(B.TargetBB);
				1462	CurMBB->addSuccessor(NextMBB);
				1463
				1464	SDValue BrAnd = DAG.getNode(ISD::BRCOND, MVT::Other, getControlRoot(),
				1465	AndCmp, DAG.getBasicBlock(B.TargetBB));
				1466
				1467	// Set NextBlock to be the MBB immediately after the current one, if any.
				1468	// This is used to avoid emitting unnecessary branches to the next block.
				1469	MachineBasicBlock *NextBlock = 0;
				1470	MachineFunction::iterator BBI = CurMBB;
				1471	if (++BBI != CurMBB->getParent()->end())
				1472	NextBlock = BBI;
				1473
				1474	if (NextMBB == NextBlock)
				1475	DAG.setRoot(BrAnd);
				1476	else
				1477	DAG.setRoot(DAG.getNode(ISD::BR, MVT::Other, BrAnd,
				1478	DAG.getBasicBlock(NextMBB)));
				1479
				1480	return;
				1481	}
				1482
				1483	void SelectionDAGLowering::visitInvoke(InvokeInst &I) {
				1484	// Retrieve successors.
				1485	MachineBasicBlock *Return = FuncInfo.MBBMap[I.getSuccessor(0)];
				1486	MachineBasicBlock *LandingPad = FuncInfo.MBBMap[I.getSuccessor(1)];
				1487
				1488	if (isa<InlineAsm>(I.getCalledValue()))
				1489	visitInlineAsm(&I);
				1490	else
				1491	LowerCallTo(&I, getValue(I.getOperand(0)), false, LandingPad);
				1492
				1493	// If the value of the invoke is used outside of its defining block, make it
				1494	// available as a virtual register.
				1495	if (!I.use_empty()) {
				1496	DenseMap<const Value*, unsigned>::iterator VMI = FuncInfo.ValueMap.find(&I);
				1497	if (VMI != FuncInfo.ValueMap.end())
				1498	CopyValueToVirtualRegister(&I, VMI->second);
				1499	}
				1500
				1501	// Update successor info
				1502	CurMBB->addSuccessor(Return);
				1503	CurMBB->addSuccessor(LandingPad);
				1504
				1505	// Drop into normal successor.
				1506	DAG.setRoot(DAG.getNode(ISD::BR, MVT::Other, getControlRoot(),
				1507	DAG.getBasicBlock(Return)));
				1508	}
				1509
				1510	void SelectionDAGLowering::visitUnwind(UnwindInst &I) {
				1511	}
				1512
				1513	/// handleSmallSwitchCaseRange - Emit a series of specific tests (suitable for
				1514	/// small case ranges).
				1515	bool SelectionDAGLowering::handleSmallSwitchRange(CaseRec& CR,
				1516	CaseRecVector& WorkList,
				1517	Value* SV,
				1518	MachineBasicBlock* Default) {
				1519	Case& BackCase = *(CR.Range.second-1);
				1520
				1521	// Size is the number of Cases represented by this range.
				1522	unsigned Size = CR.Range.second - CR.Range.first;
				1523	if (Size > 3)
				1524	return false;
				1525
				1526	// Get the MachineFunction which holds the current MBB. This is used when
				1527	// inserting any additional MBBs necessary to represent the switch.
				1528	MachineFunction *CurMF = CurMBB->getParent();
				1529
				1530	// Figure out which block is immediately after the current one.
				1531	MachineBasicBlock *NextBlock = 0;
				1532	MachineFunction::iterator BBI = CR.CaseBB;
				1533
				1534	if (++BBI != CurMBB->getParent()->end())
				1535	NextBlock = BBI;
				1536
				1537	// TODO: If any two of the cases has the same destination, and if one value
				1538	// is the same as the other, but has one bit unset that the other has set,
				1539	// use bit manipulation to do two compares at once. For example:
				1540	// "if (X == 6 \|\| X == 4)" -> "if ((X\|2) == 6)"
				1541
				1542	// Rearrange the case blocks so that the last one falls through if possible.
				1543	if (NextBlock && Default != NextBlock && BackCase.BB != NextBlock) {
				1544	// The last case block won't fall through into 'NextBlock' if we emit the
				1545	// branches in this order. See if rearranging a case value would help.
				1546	for (CaseItr I = CR.Range.first, E = CR.Range.second-1; I != E; ++I) {
				1547	if (I->BB == NextBlock) {
				1548	std::swap(*I, BackCase);
				1549	break;
				1550	}
				1551	}
				1552	}
				1553
				1554	// Create a CaseBlock record representing a conditional branch to
				1555	// the Case's target mbb if the value being switched on SV is equal
				1556	// to C.
				1557	MachineBasicBlock *CurBlock = CR.CaseBB;
				1558	for (CaseItr I = CR.Range.first, E = CR.Range.second; I != E; ++I) {
				1559	MachineBasicBlock *FallThrough;
				1560	if (I != E-1) {
				1561	FallThrough = CurMF->CreateMachineBasicBlock(CurBlock->getBasicBlock());
				1562	CurMF->insert(BBI, FallThrough);
				1563	} else {
				1564	// If the last case doesn't match, go to the default block.
				1565	FallThrough = Default;
				1566	}
				1567
				1568	Value RHS, LHS, *MHS;
				1569	ISD::CondCode CC;
				1570	if (I->High == I->Low) {
				1571	// This is just small small case range :) containing exactly 1 case
				1572	CC = ISD::SETEQ;
				1573	LHS = SV; RHS = I->High; MHS = NULL;
				1574	} else {
				1575	CC = ISD::SETLE;
				1576	LHS = I->Low; MHS = SV; RHS = I->High;
				1577	}
				1578	CaseBlock CB(CC, LHS, RHS, MHS, I->BB, FallThrough, CurBlock);
				1579
				1580	// If emitting the first comparison, just call visitSwitchCase to emit the
				1581	// code into the current block. Otherwise, push the CaseBlock onto the
				1582	// vector to be later processed by SDISel, and insert the node's MBB
				1583	// before the next MBB.
				1584	if (CurBlock == CurMBB)
				1585	visitSwitchCase(CB);
				1586	else
				1587	SwitchCases.push_back(CB);
				1588
				1589	CurBlock = FallThrough;
				1590	}
				1591
				1592	return true;
				1593	}
				1594
				1595	static inline bool areJTsAllowed(const TargetLowering &TLI) {
				1596	return !DisableJumpTables &&
				1597	(TLI.isOperationLegal(ISD::BR_JT, MVT::Other) \|\|
				1598	TLI.isOperationLegal(ISD::BRIND, MVT::Other));
				1599	}
				1600
				1601	/// handleJTSwitchCase - Emit jumptable for current switch case range
				1602	bool SelectionDAGLowering::handleJTSwitchCase(CaseRec& CR,
				1603	CaseRecVector& WorkList,
				1604	Value* SV,
				1605	MachineBasicBlock* Default) {
				1606	Case& FrontCase = *CR.Range.first;
				1607	Case& BackCase = *(CR.Range.second-1);
				1608
				1609	int64_t First = cast<ConstantInt>(FrontCase.Low)->getSExtValue();
				1610	int64_t Last = cast<ConstantInt>(BackCase.High)->getSExtValue();
				1611
				1612	uint64_t TSize = 0;
				1613	for (CaseItr I = CR.Range.first, E = CR.Range.second;
				1614	I!=E; ++I)
				1615	TSize += I->size();
				1616
				1617	if (!areJTsAllowed(TLI) \|\| TSize <= 3)
				1618	return false;
				1619
				1620	double Density = (double)TSize / (double)((Last - First) + 1ULL);
				1621	if (Density < 0.4)
				1622	return false;
				1623
				1624	DOUT << "Lowering jump table\n"
				1625	<< "First entry: " << First << ". Last entry: " << Last << "\n"
				1626	<< "Size: " << TSize << ". Density: " << Density << "\n\n";
				1627
				1628	// Get the MachineFunction which holds the current MBB. This is used when
				1629	// inserting any additional MBBs necessary to represent the switch.
				1630	MachineFunction *CurMF = CurMBB->getParent();
				1631
				1632	// Figure out which block is immediately after the current one.
				1633	MachineBasicBlock *NextBlock = 0;
				1634	MachineFunction::iterator BBI = CR.CaseBB;
				1635
				1636	if (++BBI != CurMBB->getParent()->end())
				1637	NextBlock = BBI;
				1638
				1639	const BasicBlock *LLVMBB = CR.CaseBB->getBasicBlock();
				1640
				1641	// Create a new basic block to hold the code for loading the address
				1642	// of the jump table, and jumping to it. Update successor information;
				1643	// we will either branch to the default case for the switch, or the jump
				1644	// table.
				1645	MachineBasicBlock *JumpTableBB = CurMF->CreateMachineBasicBlock(LLVMBB);
				1646	CurMF->insert(BBI, JumpTableBB);
				1647	CR.CaseBB->addSuccessor(Default);
				1648	CR.CaseBB->addSuccessor(JumpTableBB);
				1649
				1650	// Build a vector of destination BBs, corresponding to each target
				1651	// of the jump table. If the value of the jump table slot corresponds to
				1652	// a case statement, push the case's BB onto the vector, otherwise, push
				1653	// the default BB.
				1654	std::vector<MachineBasicBlock*> DestBBs;
				1655	int64_t TEI = First;
				1656	for (CaseItr I = CR.Range.first, E = CR.Range.second; I != E; ++TEI) {
				1657	int64_t Low = cast<ConstantInt>(I->Low)->getSExtValue();
				1658	int64_t High = cast<ConstantInt>(I->High)->getSExtValue();
				1659
				1660	if ((Low <= TEI) && (TEI <= High)) {
				1661	DestBBs.push_back(I->BB);
				1662	if (TEI==High)
				1663	++I;
				1664	} else {
				1665	DestBBs.push_back(Default);
				1666	}
				1667	}
				1668
				1669	// Update successor info. Add one edge to each unique successor.
				1670	BitVector SuccsHandled(CR.CaseBB->getParent()->getNumBlockIDs());
				1671	for (std::vector<MachineBasicBlock*>::iterator I = DestBBs.begin(),
				1672	E = DestBBs.end(); I != E; ++I) {
				1673	if (!SuccsHandled[(*I)->getNumber()]) {
				1674	SuccsHandled[(*I)->getNumber()] = true;
				1675	JumpTableBB->addSuccessor(*I);
				1676	}
				1677	}
				1678
				1679	// Create a jump table index for this jump table, or return an existing
				1680	// one.
				1681	unsigned JTI = CurMF->getJumpTableInfo()->getJumpTableIndex(DestBBs);
				1682
				1683	// Set the jump table information so that we can codegen it as a second
				1684	// MachineBasicBlock
				1685	JumpTable JT(-1U, JTI, JumpTableBB, Default);
				1686	JumpTableHeader JTH(First, Last, SV, CR.CaseBB, (CR.CaseBB == CurMBB));
				1687	if (CR.CaseBB == CurMBB)
				1688	visitJumpTableHeader(JT, JTH);
				1689
				1690	JTCases.push_back(JumpTableBlock(JTH, JT));
				1691
				1692	return true;
				1693	}
				1694
				1695	/// handleBTSplitSwitchCase - emit comparison and split binary search tree into
				1696	/// 2 subtrees.
				1697	bool SelectionDAGLowering::handleBTSplitSwitchCase(CaseRec& CR,
				1698	CaseRecVector& WorkList,
				1699	Value* SV,
				1700	MachineBasicBlock* Default) {
				1701	// Get the MachineFunction which holds the current MBB. This is used when
				1702	// inserting any additional MBBs necessary to represent the switch.
				1703	MachineFunction *CurMF = CurMBB->getParent();
				1704
				1705	// Figure out which block is immediately after the current one.
				1706	MachineBasicBlock *NextBlock = 0;
				1707	MachineFunction::iterator BBI = CR.CaseBB;
				1708
				1709	if (++BBI != CurMBB->getParent()->end())
				1710	NextBlock = BBI;
				1711
				1712	Case& FrontCase = *CR.Range.first;
				1713	Case& BackCase = *(CR.Range.second-1);
				1714	const BasicBlock *LLVMBB = CR.CaseBB->getBasicBlock();
				1715
				1716	// Size is the number of Cases represented by this range.
				1717	unsigned Size = CR.Range.second - CR.Range.first;
				1718
				1719	int64_t First = cast<ConstantInt>(FrontCase.Low)->getSExtValue();
				1720	int64_t Last = cast<ConstantInt>(BackCase.High)->getSExtValue();
				1721	double FMetric = 0;
				1722	CaseItr Pivot = CR.Range.first + Size/2;
				1723
				1724	// Select optimal pivot, maximizing sum density of LHS and RHS. This will
				1725	// (heuristically) allow us to emit JumpTable's later.
				1726	uint64_t TSize = 0;
				1727	for (CaseItr I = CR.Range.first, E = CR.Range.second;
				1728	I!=E; ++I)
				1729	TSize += I->size();
				1730
				1731	uint64_t LSize = FrontCase.size();
				1732	uint64_t RSize = TSize-LSize;
				1733	DOUT << "Selecting best pivot: \n"
				1734	<< "First: " << First << ", Last: " << Last <<"\n"
				1735	<< "LSize: " << LSize << ", RSize: " << RSize << "\n";
				1736	for (CaseItr I = CR.Range.first, J=I+1, E = CR.Range.second;
				1737	J!=E; ++I, ++J) {
				1738	int64_t LEnd = cast<ConstantInt>(I->High)->getSExtValue();
				1739	int64_t RBegin = cast<ConstantInt>(J->Low)->getSExtValue();
				1740	assert((RBegin-LEnd>=1) && "Invalid case distance");
				1741	double LDensity = (double)LSize / (double)((LEnd - First) + 1ULL);
				1742	double RDensity = (double)RSize / (double)((Last - RBegin) + 1ULL);
				1743	double Metric = Log2_64(RBegin-LEnd)*(LDensity+RDensity);
				1744	// Should always split in some non-trivial place
				1745	DOUT <<"=>Step\n"
				1746	<< "LEnd: " << LEnd << ", RBegin: " << RBegin << "\n"
				1747	<< "LDensity: " << LDensity << ", RDensity: " << RDensity << "\n"
				1748	<< "Metric: " << Metric << "\n";
				1749	if (FMetric < Metric) {
				1750	Pivot = J;
				1751	FMetric = Metric;
				1752	DOUT << "Current metric set to: " << FMetric << "\n";
				1753	}
				1754
				1755	LSize += J->size();
				1756	RSize -= J->size();
				1757	}
				1758	if (areJTsAllowed(TLI)) {
				1759	// If our case is dense we really should handle it earlier!
				1760	assert((FMetric > 0) && "Should handle dense range earlier!");
				1761	} else {
				1762	Pivot = CR.Range.first + Size/2;
				1763	}
				1764
				1765	CaseRange LHSR(CR.Range.first, Pivot);
				1766	CaseRange RHSR(Pivot, CR.Range.second);
				1767	Constant *C = Pivot->Low;
				1768	MachineBasicBlock FalseBB = 0, TrueBB = 0;
				1769
				1770	// We know that we branch to the LHS if the Value being switched on is
				1771	// less than the Pivot value, C. We use this to optimize our binary
				1772	// tree a bit, by recognizing that if SV is greater than or equal to the
				1773	// LHS's Case Value, and that Case Value is exactly one less than the
				1774	// Pivot's Value, then we can branch directly to the LHS's Target,
				1775	// rather than creating a leaf node for it.
				1776	if ((LHSR.second - LHSR.first) == 1 &&
				1777	LHSR.first->High == CR.GE &&
				1778	cast<ConstantInt>(C)->getSExtValue() ==
				1779	(cast<ConstantInt>(CR.GE)->getSExtValue() + 1LL)) {
				1780	TrueBB = LHSR.first->BB;
				1781	} else {
				1782	TrueBB = CurMF->CreateMachineBasicBlock(LLVMBB);
				1783	CurMF->insert(BBI, TrueBB);
				1784	WorkList.push_back(CaseRec(TrueBB, C, CR.GE, LHSR));
				1785	}
				1786
				1787	// Similar to the optimization above, if the Value being switched on is
				1788	// known to be less than the Constant CR.LT, and the current Case Value
				1789	// is CR.LT - 1, then we can branch directly to the target block for
				1790	// the current Case Value, rather than emitting a RHS leaf node for it.
				1791	if ((RHSR.second - RHSR.first) == 1 && CR.LT &&
				1792	cast<ConstantInt>(RHSR.first->Low)->getSExtValue() ==
				1793	(cast<ConstantInt>(CR.LT)->getSExtValue() - 1LL)) {
				1794	FalseBB = RHSR.first->BB;
				1795	} else {
				1796	FalseBB = CurMF->CreateMachineBasicBlock(LLVMBB);
				1797	CurMF->insert(BBI, FalseBB);
				1798	WorkList.push_back(CaseRec(FalseBB,CR.LT,C,RHSR));
				1799	}
				1800
				1801	// Create a CaseBlock record representing a conditional branch to
				1802	// the LHS node if the value being switched on SV is less than C.
				1803	// Otherwise, branch to LHS.
				1804	CaseBlock CB(ISD::SETLT, SV, C, NULL, TrueBB, FalseBB, CR.CaseBB);
				1805
				1806	if (CR.CaseBB == CurMBB)
				1807	visitSwitchCase(CB);
				1808	else
				1809	SwitchCases.push_back(CB);
				1810
				1811	return true;
				1812	}
				1813
				1814	/// handleBitTestsSwitchCase - if current case range has few destination and
				1815	/// range span less, than machine word bitwidth, encode case range into series
				1816	/// of masks and emit bit tests with these masks.
				1817	bool SelectionDAGLowering::handleBitTestsSwitchCase(CaseRec& CR,
				1818	CaseRecVector& WorkList,
				1819	Value* SV,
				1820	MachineBasicBlock* Default){
				1821	unsigned IntPtrBits = TLI.getPointerTy().getSizeInBits();
				1822
				1823	Case& FrontCase = *CR.Range.first;
				1824	Case& BackCase = *(CR.Range.second-1);
				1825
				1826	// Get the MachineFunction which holds the current MBB. This is used when
				1827	// inserting any additional MBBs necessary to represent the switch.
				1828	MachineFunction *CurMF = CurMBB->getParent();
				1829
				1830	unsigned numCmps = 0;
				1831	for (CaseItr I = CR.Range.first, E = CR.Range.second;
				1832	I!=E; ++I) {
				1833	// Single case counts one, case range - two.
				1834	if (I->Low == I->High)
				1835	numCmps +=1;
				1836	else
				1837	numCmps +=2;
				1838	}
				1839
				1840	// Count unique destinations
				1841	SmallSet<MachineBasicBlock*, 4> Dests;
				1842	for (CaseItr I = CR.Range.first, E = CR.Range.second; I!=E; ++I) {
				1843	Dests.insert(I->BB);
				1844	if (Dests.size() > 3)
				1845	// Don't bother the code below, if there are too much unique destinations
				1846	return false;
				1847	}
				1848	DOUT << "Total number of unique destinations: " << Dests.size() << "\n"
				1849	<< "Total number of comparisons: " << numCmps << "\n";
				1850
				1851	// Compute span of values.
				1852	Constant* minValue = FrontCase.Low;
				1853	Constant* maxValue = BackCase.High;
				1854	uint64_t range = cast<ConstantInt>(maxValue)->getSExtValue() -
				1855	cast<ConstantInt>(minValue)->getSExtValue();
				1856	DOUT << "Compare range: " << range << "\n"
				1857	<< "Low bound: " << cast<ConstantInt>(minValue)->getSExtValue() << "\n"
				1858	<< "High bound: " << cast<ConstantInt>(maxValue)->getSExtValue() << "\n";
				1859
				1860	if (range>=IntPtrBits \|\|
				1861	(!(Dests.size() == 1 && numCmps >= 3) &&
				1862	!(Dests.size() == 2 && numCmps >= 5) &&
				1863	!(Dests.size() >= 3 && numCmps >= 6)))
				1864	return false;
				1865
				1866	DOUT << "Emitting bit tests\n";
				1867	int64_t lowBound = 0;
				1868
				1869	// Optimize the case where all the case values fit in a
				1870	// word without having to subtract minValue. In this case,
				1871	// we can optimize away the subtraction.
				1872	if (cast<ConstantInt>(minValue)->getSExtValue() >= 0 &&
				1873	cast<ConstantInt>(maxValue)->getSExtValue() < IntPtrBits) {
				1874	range = cast<ConstantInt>(maxValue)->getSExtValue();
				1875	} else {
				1876	lowBound = cast<ConstantInt>(minValue)->getSExtValue();
				1877	}
				1878
				1879	CaseBitsVector CasesBits;
				1880	unsigned i, count = 0;
				1881
				1882	for (CaseItr I = CR.Range.first, E = CR.Range.second; I!=E; ++I) {
				1883	MachineBasicBlock* Dest = I->BB;
				1884	for (i = 0; i < count; ++i)
				1885	if (Dest == CasesBits[i].BB)
				1886	break;
				1887
				1888	if (i == count) {
				1889	assert((count < 3) && "Too much destinations to test!");
				1890	CasesBits.push_back(CaseBits(0, Dest, 0));
				1891	count++;
				1892	}
				1893
				1894	uint64_t lo = cast<ConstantInt>(I->Low)->getSExtValue() - lowBound;
				1895	uint64_t hi = cast<ConstantInt>(I->High)->getSExtValue() - lowBound;
				1896
				1897	for (uint64_t j = lo; j <= hi; j++) {
				1898	CasesBits[i].Mask \|= 1ULL << j;
				1899	CasesBits[i].Bits++;
				1900	}
				1901
				1902	}
				1903	std::sort(CasesBits.begin(), CasesBits.end(), CaseBitsCmp());
				1904
				1905	BitTestInfo BTC;
				1906
				1907	// Figure out which block is immediately after the current one.
				1908	MachineFunction::iterator BBI = CR.CaseBB;
				1909	++BBI;
				1910
				1911	const BasicBlock *LLVMBB = CR.CaseBB->getBasicBlock();
				1912
				1913	DOUT << "Cases:\n";
				1914	for (unsigned i = 0, e = CasesBits.size(); i!=e; ++i) {
				1915	DOUT << "Mask: " << CasesBits[i].Mask << ", Bits: " << CasesBits[i].Bits
				1916	<< ", BB: " << CasesBits[i].BB << "\n";
				1917
				1918	MachineBasicBlock *CaseBB = CurMF->CreateMachineBasicBlock(LLVMBB);
				1919	CurMF->insert(BBI, CaseBB);
				1920	BTC.push_back(BitTestCase(CasesBits[i].Mask,
				1921	CaseBB,
				1922	CasesBits[i].BB));
				1923	}
				1924
				1925	BitTestBlock BTB(lowBound, range, SV,
				1926	-1U, (CR.CaseBB == CurMBB),
				1927	CR.CaseBB, Default, BTC);
				1928
				1929	if (CR.CaseBB == CurMBB)
				1930	visitBitTestHeader(BTB);
				1931
				1932	BitTestCases.push_back(BTB);
				1933
				1934	return true;
				1935	}
				1936
				1937
				1938	/// Clusterify - Transform simple list of Cases into list of CaseRange's
				1939	unsigned SelectionDAGLowering::Clusterify(CaseVector& Cases,
				1940	const SwitchInst& SI) {
				1941	unsigned numCmps = 0;
				1942
				1943	// Start with "simple" cases
				1944	for (unsigned i = 1; i < SI.getNumSuccessors(); ++i) {
				1945	MachineBasicBlock *SMBB = FuncInfo.MBBMap[SI.getSuccessor(i)];
				1946	Cases.push_back(Case(SI.getSuccessorValue(i),
				1947	SI.getSuccessorValue(i),
				1948	SMBB));
				1949	}
				1950	std::sort(Cases.begin(), Cases.end(), CaseCmp());
				1951
				1952	// Merge case into clusters
				1953	if (Cases.size()>=2)
				1954	// Must recompute end() each iteration because it may be
				1955	// invalidated by erase if we hold on to it
				1956	for (CaseItr I=Cases.begin(), J=++(Cases.begin()); J!=Cases.end(); ) {
				1957	int64_t nextValue = cast<ConstantInt>(J->Low)->getSExtValue();
				1958	int64_t currentValue = cast<ConstantInt>(I->High)->getSExtValue();
				1959	MachineBasicBlock* nextBB = J->BB;
				1960	MachineBasicBlock* currentBB = I->BB;
				1961
				1962	// If the two neighboring cases go to the same destination, merge them
				1963	// into a single case.
				1964	if ((nextValue-currentValue==1) && (currentBB == nextBB)) {
				1965	I->High = J->High;
				1966	J = Cases.erase(J);
				1967	} else {
				1968	I = J++;
				1969	}
				1970	}
				1971
				1972	for (CaseItr I=Cases.begin(), E=Cases.end(); I!=E; ++I, ++numCmps) {
				1973	if (I->Low != I->High)
				1974	// A range counts double, since it requires two compares.
				1975	++numCmps;
				1976	}
				1977
				1978	return numCmps;
				1979	}
				1980
				1981	void SelectionDAGLowering::visitSwitch(SwitchInst &SI) {
				1982	// Figure out which block is immediately after the current one.
				1983	MachineBasicBlock *NextBlock = 0;
				1984	MachineFunction::iterator BBI = CurMBB;
				1985
				1986	MachineBasicBlock *Default = FuncInfo.MBBMap[SI.getDefaultDest()];
				1987
				1988	// If there is only the default destination, branch to it if it is not the
				1989	// next basic block. Otherwise, just fall through.
				1990	if (SI.getNumOperands() == 2) {
				1991	// Update machine-CFG edges.
				1992
				1993	// If this is not a fall-through branch, emit the branch.
				1994	CurMBB->addSuccessor(Default);
				1995	if (Default != NextBlock)
				1996	DAG.setRoot(DAG.getNode(ISD::BR, MVT::Other, getControlRoot(),
				1997	DAG.getBasicBlock(Default)));
				1998
				1999	return;
				2000	}
				2001
				2002	// If there are any non-default case statements, create a vector of Cases
				2003	// representing each one, and sort the vector so that we can efficiently
				2004	// create a binary search tree from them.
				2005	CaseVector Cases;
				2006	unsigned numCmps = Clusterify(Cases, SI);
				2007	DOUT << "Clusterify finished. Total clusters: " << Cases.size()
				2008	<< ". Total compares: " << numCmps << "\n";
				2009
				2010	// Get the Value to be switched on and default basic blocks, which will be
				2011	// inserted into CaseBlock records, representing basic blocks in the binary
				2012	// search tree.
				2013	Value *SV = SI.getOperand(0);
				2014
				2015	// Push the initial CaseRec onto the worklist
				2016	CaseRecVector WorkList;
				2017	WorkList.push_back(CaseRec(CurMBB,0,0,CaseRange(Cases.begin(),Cases.end())));
				2018
				2019	while (!WorkList.empty()) {
				2020	// Grab a record representing a case range to process off the worklist
				2021	CaseRec CR = WorkList.back();
				2022	WorkList.pop_back();
				2023
				2024	if (handleBitTestsSwitchCase(CR, WorkList, SV, Default))
				2025	continue;
				2026
				2027	// If the range has few cases (two or less) emit a series of specific
				2028	// tests.
				2029	if (handleSmallSwitchRange(CR, WorkList, SV, Default))
				2030	continue;
				2031
				2032	// If the switch has more than 5 blocks, and at least 40% dense, and the
				2033	// target supports indirect branches, then emit a jump table rather than
				2034	// lowering the switch to a binary tree of conditional branches.
				2035	if (handleJTSwitchCase(CR, WorkList, SV, Default))
				2036	continue;
				2037
				2038	// Emit binary tree. We need to pick a pivot, and push left and right ranges
				2039	// onto the worklist. Leafs are handled via handleSmallSwitchRange() call.
				2040	handleBTSplitSwitchCase(CR, WorkList, SV, Default);
				2041	}
				2042	}
				2043
				2044
				2045	void SelectionDAGLowering::visitSub(User &I) {
				2046	// -0.0 - X --> fneg
				2047	const Type *Ty = I.getType();
				2048	if (isa<VectorType>(Ty)) {
				2049	if (ConstantVector *CV = dyn_cast<ConstantVector>(I.getOperand(0))) {
				2050	const VectorType *DestTy = cast<VectorType>(I.getType());
				2051	const Type *ElTy = DestTy->getElementType();
				2052	if (ElTy->isFloatingPoint()) {
				2053	unsigned VL = DestTy->getNumElements();
				2054	std::vector<Constant*> NZ(VL, ConstantFP::getNegativeZero(ElTy));
				2055	Constant *CNZ = ConstantVector::get(&NZ[0], NZ.size());
				2056	if (CV == CNZ) {
				2057	SDValue Op2 = getValue(I.getOperand(1));
				2058	setValue(&I, DAG.getNode(ISD::FNEG, Op2.getValueType(), Op2));
				2059	return;
				2060	}
				2061	}
				2062	}
				2063	}
				2064	if (Ty->isFloatingPoint()) {
				2065	if (ConstantFP *CFP = dyn_cast<ConstantFP>(I.getOperand(0)))
				2066	if (CFP->isExactlyValue(ConstantFP::getNegativeZero(Ty)->getValueAPF())) {
				2067	SDValue Op2 = getValue(I.getOperand(1));
				2068	setValue(&I, DAG.getNode(ISD::FNEG, Op2.getValueType(), Op2));
				2069	return;
				2070	}
				2071	}
				2072
				2073	visitBinary(I, Ty->isFPOrFPVector() ? ISD::FSUB : ISD::SUB);
				2074	}
				2075
				2076	void SelectionDAGLowering::visitBinary(User &I, unsigned OpCode) {
				2077	SDValue Op1 = getValue(I.getOperand(0));
				2078	SDValue Op2 = getValue(I.getOperand(1));
				2079
				2080	setValue(&I, DAG.getNode(OpCode, Op1.getValueType(), Op1, Op2));
				2081	}
				2082
				2083	void SelectionDAGLowering::visitShift(User &I, unsigned Opcode) {
				2084	SDValue Op1 = getValue(I.getOperand(0));
				2085	SDValue Op2 = getValue(I.getOperand(1));
				2086	if (!isa<VectorType>(I.getType())) {
				2087	if (TLI.getShiftAmountTy().bitsLT(Op2.getValueType()))
				2088	Op2 = DAG.getNode(ISD::TRUNCATE, TLI.getShiftAmountTy(), Op2);
				2089	else if (TLI.getShiftAmountTy().bitsGT(Op2.getValueType()))
				2090	Op2 = DAG.getNode(ISD::ANY_EXTEND, TLI.getShiftAmountTy(), Op2);
				2091	}
				2092
				2093	setValue(&I, DAG.getNode(Opcode, Op1.getValueType(), Op1, Op2));
				2094	}
				2095
				2096	void SelectionDAGLowering::visitICmp(User &I) {
				2097	ICmpInst::Predicate predicate = ICmpInst::BAD_ICMP_PREDICATE;
				2098	if (ICmpInst *IC = dyn_cast<ICmpInst>(&I))
				2099	predicate = IC->getPredicate();
				2100	else if (ConstantExpr *IC = dyn_cast<ConstantExpr>(&I))
				2101	predicate = ICmpInst::Predicate(IC->getPredicate());
				2102	SDValue Op1 = getValue(I.getOperand(0));
				2103	SDValue Op2 = getValue(I.getOperand(1));
Dan Gohman	8c1a6ca	2008-10-17 18:18:45 +0000	[diff] [blame]	2104	ISD::CondCode Opcode = getICmpCondCode(predicate);
Dan Gohman	f0cbcd4	2008-09-03 16:12:24 +0000	[diff] [blame]	2105	setValue(&I, DAG.getSetCC(MVT::i1, Op1, Op2, Opcode));
				2106	}
				2107
				2108	void SelectionDAGLowering::visitFCmp(User &I) {
				2109	FCmpInst::Predicate predicate = FCmpInst::BAD_FCMP_PREDICATE;
				2110	if (FCmpInst *FC = dyn_cast<FCmpInst>(&I))
				2111	predicate = FC->getPredicate();
				2112	else if (ConstantExpr *FC = dyn_cast<ConstantExpr>(&I))
				2113	predicate = FCmpInst::Predicate(FC->getPredicate());
				2114	SDValue Op1 = getValue(I.getOperand(0));
				2115	SDValue Op2 = getValue(I.getOperand(1));
Dan Gohman	8c1a6ca	2008-10-17 18:18:45 +0000	[diff] [blame]	2116	ISD::CondCode Condition = getFCmpCondCode(predicate);
Dan Gohman	f0cbcd4	2008-09-03 16:12:24 +0000	[diff] [blame]	2117	setValue(&I, DAG.getSetCC(MVT::i1, Op1, Op2, Condition));
				2118	}
				2119
				2120	void SelectionDAGLowering::visitVICmp(User &I) {
				2121	ICmpInst::Predicate predicate = ICmpInst::BAD_ICMP_PREDICATE;
				2122	if (VICmpInst *IC = dyn_cast<VICmpInst>(&I))
				2123	predicate = IC->getPredicate();
				2124	else if (ConstantExpr *IC = dyn_cast<ConstantExpr>(&I))
				2125	predicate = ICmpInst::Predicate(IC->getPredicate());
				2126	SDValue Op1 = getValue(I.getOperand(0));
				2127	SDValue Op2 = getValue(I.getOperand(1));
Dan Gohman	8c1a6ca	2008-10-17 18:18:45 +0000	[diff] [blame]	2128	ISD::CondCode Opcode = getICmpCondCode(predicate);
Dan Gohman	f0cbcd4	2008-09-03 16:12:24 +0000	[diff] [blame]	2129	setValue(&I, DAG.getVSetCC(Op1.getValueType(), Op1, Op2, Opcode));
				2130	}
				2131
				2132	void SelectionDAGLowering::visitVFCmp(User &I) {
				2133	FCmpInst::Predicate predicate = FCmpInst::BAD_FCMP_PREDICATE;
				2134	if (VFCmpInst *FC = dyn_cast<VFCmpInst>(&I))
				2135	predicate = FC->getPredicate();
				2136	else if (ConstantExpr *FC = dyn_cast<ConstantExpr>(&I))
				2137	predicate = FCmpInst::Predicate(FC->getPredicate());
				2138	SDValue Op1 = getValue(I.getOperand(0));
				2139	SDValue Op2 = getValue(I.getOperand(1));
Dan Gohman	8c1a6ca	2008-10-17 18:18:45 +0000	[diff] [blame]	2140	ISD::CondCode Condition = getFCmpCondCode(predicate);
Dan Gohman	f0cbcd4	2008-09-03 16:12:24 +0000	[diff] [blame]	2141	MVT DestVT = TLI.getValueType(I.getType());
				2142
				2143	setValue(&I, DAG.getVSetCC(DestVT, Op1, Op2, Condition));
				2144	}
				2145
				2146	void SelectionDAGLowering::visitSelect(User &I) {
Dan Gohman	7ea1ca6	2008-10-21 20:00:42 +0000	[diff] [blame]	2147	SmallVector<MVT, 4> ValueVTs;
				2148	ComputeValueVTs(TLI, I.getType(), ValueVTs);
				2149	unsigned NumValues = ValueVTs.size();
				2150	if (NumValues != 0) {
				2151	SmallVector<SDValue, 4> Values(NumValues);
				2152	SDValue Cond = getValue(I.getOperand(0));
				2153	SDValue TrueVal = getValue(I.getOperand(1));
				2154	SDValue FalseVal = getValue(I.getOperand(2));
				2155
				2156	for (unsigned i = 0; i != NumValues; ++i)
				2157	Values[i] = DAG.getNode(ISD::SELECT, TrueVal.getValueType(), Cond,
				2158	SDValue(TrueVal.getNode(), TrueVal.getResNo() + i),
				2159	SDValue(FalseVal.getNode(), FalseVal.getResNo() + i));
				2160
Duncan Sands	aaffa05	2008-12-01 11:41:29 +0000	[diff] [blame]	2161	setValue(&I, DAG.getNode(ISD::MERGE_VALUES,
				2162	DAG.getVTList(&ValueVTs[0], NumValues),
				2163	&Values[0], NumValues));
Dan Gohman	7ea1ca6	2008-10-21 20:00:42 +0000	[diff] [blame]	2164	}
Dan Gohman	f0cbcd4	2008-09-03 16:12:24 +0000	[diff] [blame]	2165	}
				2166
				2167
				2168	void SelectionDAGLowering::visitTrunc(User &I) {
				2169	// TruncInst cannot be a no-op cast because sizeof(src) > sizeof(dest).
				2170	SDValue N = getValue(I.getOperand(0));
				2171	MVT DestVT = TLI.getValueType(I.getType());
				2172	setValue(&I, DAG.getNode(ISD::TRUNCATE, DestVT, N));
				2173	}
				2174
				2175	void SelectionDAGLowering::visitZExt(User &I) {
				2176	// ZExt cannot be a no-op cast because sizeof(src) < sizeof(dest).
				2177	// ZExt also can't be a cast to bool for same reason. So, nothing much to do
				2178	SDValue N = getValue(I.getOperand(0));
				2179	MVT DestVT = TLI.getValueType(I.getType());
				2180	setValue(&I, DAG.getNode(ISD::ZERO_EXTEND, DestVT, N));
				2181	}
				2182
				2183	void SelectionDAGLowering::visitSExt(User &I) {
				2184	// SExt cannot be a no-op cast because sizeof(src) < sizeof(dest).
				2185	// SExt also can't be a cast to bool for same reason. So, nothing much to do
				2186	SDValue N = getValue(I.getOperand(0));
				2187	MVT DestVT = TLI.getValueType(I.getType());
				2188	setValue(&I, DAG.getNode(ISD::SIGN_EXTEND, DestVT, N));
				2189	}
				2190
				2191	void SelectionDAGLowering::visitFPTrunc(User &I) {
				2192	// FPTrunc is never a no-op cast, no need to check
				2193	SDValue N = getValue(I.getOperand(0));
				2194	MVT DestVT = TLI.getValueType(I.getType());
				2195	setValue(&I, DAG.getNode(ISD::FP_ROUND, DestVT, N, DAG.getIntPtrConstant(0)));
				2196	}
				2197
				2198	void SelectionDAGLowering::visitFPExt(User &I){
				2199	// FPTrunc is never a no-op cast, no need to check
				2200	SDValue N = getValue(I.getOperand(0));
				2201	MVT DestVT = TLI.getValueType(I.getType());
				2202	setValue(&I, DAG.getNode(ISD::FP_EXTEND, DestVT, N));
				2203	}
				2204
				2205	void SelectionDAGLowering::visitFPToUI(User &I) {
				2206	// FPToUI is never a no-op cast, no need to check
				2207	SDValue N = getValue(I.getOperand(0));
				2208	MVT DestVT = TLI.getValueType(I.getType());
				2209	setValue(&I, DAG.getNode(ISD::FP_TO_UINT, DestVT, N));
				2210	}
				2211
				2212	void SelectionDAGLowering::visitFPToSI(User &I) {
				2213	// FPToSI is never a no-op cast, no need to check
				2214	SDValue N = getValue(I.getOperand(0));
				2215	MVT DestVT = TLI.getValueType(I.getType());
				2216	setValue(&I, DAG.getNode(ISD::FP_TO_SINT, DestVT, N));
				2217	}
				2218
				2219	void SelectionDAGLowering::visitUIToFP(User &I) {
				2220	// UIToFP is never a no-op cast, no need to check
				2221	SDValue N = getValue(I.getOperand(0));
				2222	MVT DestVT = TLI.getValueType(I.getType());
				2223	setValue(&I, DAG.getNode(ISD::UINT_TO_FP, DestVT, N));
				2224	}
				2225
				2226	void SelectionDAGLowering::visitSIToFP(User &I){
Bill Wendling	181b627	2008-10-19 20:34:04 +0000	[diff] [blame]	2227	// SIToFP is never a no-op cast, no need to check
Dan Gohman	f0cbcd4	2008-09-03 16:12:24 +0000	[diff] [blame]	2228	SDValue N = getValue(I.getOperand(0));
				2229	MVT DestVT = TLI.getValueType(I.getType());
				2230	setValue(&I, DAG.getNode(ISD::SINT_TO_FP, DestVT, N));
				2231	}
				2232
				2233	void SelectionDAGLowering::visitPtrToInt(User &I) {
				2234	// What to do depends on the size of the integer and the size of the pointer.
				2235	// We can either truncate, zero extend, or no-op, accordingly.
				2236	SDValue N = getValue(I.getOperand(0));
				2237	MVT SrcVT = N.getValueType();
				2238	MVT DestVT = TLI.getValueType(I.getType());
				2239	SDValue Result;
				2240	if (DestVT.bitsLT(SrcVT))
				2241	Result = DAG.getNode(ISD::TRUNCATE, DestVT, N);
				2242	else
				2243	// Note: ZERO_EXTEND can handle cases where the sizes are equal too
				2244	Result = DAG.getNode(ISD::ZERO_EXTEND, DestVT, N);
				2245	setValue(&I, Result);
				2246	}
				2247
				2248	void SelectionDAGLowering::visitIntToPtr(User &I) {
				2249	// What to do depends on the size of the integer and the size of the pointer.
				2250	// We can either truncate, zero extend, or no-op, accordingly.
				2251	SDValue N = getValue(I.getOperand(0));
				2252	MVT SrcVT = N.getValueType();
				2253	MVT DestVT = TLI.getValueType(I.getType());
				2254	if (DestVT.bitsLT(SrcVT))
				2255	setValue(&I, DAG.getNode(ISD::TRUNCATE, DestVT, N));
				2256	else
				2257	// Note: ZERO_EXTEND can handle cases where the sizes are equal too
				2258	setValue(&I, DAG.getNode(ISD::ZERO_EXTEND, DestVT, N));
				2259	}
				2260
				2261	void SelectionDAGLowering::visitBitCast(User &I) {
				2262	SDValue N = getValue(I.getOperand(0));
				2263	MVT DestVT = TLI.getValueType(I.getType());
				2264
				2265	// BitCast assures us that source and destination are the same size so this
				2266	// is either a BIT_CONVERT or a no-op.
				2267	if (DestVT != N.getValueType())
				2268	setValue(&I, DAG.getNode(ISD::BIT_CONVERT, DestVT, N)); // convert types
				2269	else
				2270	setValue(&I, N); // noop cast.
				2271	}
				2272
				2273	void SelectionDAGLowering::visitInsertElement(User &I) {
				2274	SDValue InVec = getValue(I.getOperand(0));
				2275	SDValue InVal = getValue(I.getOperand(1));
				2276	SDValue InIdx = DAG.getNode(ISD::ZERO_EXTEND, TLI.getPointerTy(),
				2277	getValue(I.getOperand(2)));
				2278
				2279	setValue(&I, DAG.getNode(ISD::INSERT_VECTOR_ELT,
				2280	TLI.getValueType(I.getType()),
				2281	InVec, InVal, InIdx));
				2282	}
				2283
				2284	void SelectionDAGLowering::visitExtractElement(User &I) {
				2285	SDValue InVec = getValue(I.getOperand(0));
				2286	SDValue InIdx = DAG.getNode(ISD::ZERO_EXTEND, TLI.getPointerTy(),
				2287	getValue(I.getOperand(1)));
				2288	setValue(&I, DAG.getNode(ISD::EXTRACT_VECTOR_ELT,
				2289	TLI.getValueType(I.getType()), InVec, InIdx));
				2290	}
				2291
Mon P Wang	aeb06d2	2008-11-10 04:46:22 +0000	[diff] [blame]	2292
				2293	// Utility for visitShuffleVector - Returns true if the mask is mask starting
				2294	// from SIndx and increasing to the element length (undefs are allowed).
				2295	static bool SequentialMask(SDValue Mask, unsigned SIndx) {
Mon P Wang	c7849c2	2008-11-16 05:06:27 +0000	[diff] [blame]	2296	unsigned MaskNumElts = Mask.getNumOperands();
				2297	for (unsigned i = 0; i != MaskNumElts; ++i) {
Mon P Wang	aeb06d2	2008-11-10 04:46:22 +0000	[diff] [blame]	2298	if (Mask.getOperand(i).getOpcode() != ISD::UNDEF) {
				2299	unsigned Idx = cast<ConstantSDNode>(Mask.getOperand(i))->getZExtValue();
				2300	if (Idx != i + SIndx)
				2301	return false;
				2302	}
				2303	}
				2304	return true;
				2305	}
				2306
Dan Gohman	f0cbcd4	2008-09-03 16:12:24 +0000	[diff] [blame]	2307	void SelectionDAGLowering::visitShuffleVector(User &I) {
Mon P Wang	230e4fa	2008-11-21 04:25:21 +0000	[diff] [blame]	2308	SDValue Src1 = getValue(I.getOperand(0));
				2309	SDValue Src2 = getValue(I.getOperand(1));
Dan Gohman	f0cbcd4	2008-09-03 16:12:24 +0000	[diff] [blame]	2310	SDValue Mask = getValue(I.getOperand(2));
				2311
Mon P Wang	aeb06d2	2008-11-10 04:46:22 +0000	[diff] [blame]	2312	MVT VT = TLI.getValueType(I.getType());
Mon P Wang	230e4fa	2008-11-21 04:25:21 +0000	[diff] [blame]	2313	MVT SrcVT = Src1.getValueType();
Mon P Wang	c7849c2	2008-11-16 05:06:27 +0000	[diff] [blame]	2314	int MaskNumElts = Mask.getNumOperands();
				2315	int SrcNumElts = SrcVT.getVectorNumElements();
Mon P Wang	aeb06d2	2008-11-10 04:46:22 +0000	[diff] [blame]	2316
Mon P Wang	c7849c2	2008-11-16 05:06:27 +0000	[diff] [blame]	2317	if (SrcNumElts == MaskNumElts) {
Mon P Wang	230e4fa	2008-11-21 04:25:21 +0000	[diff] [blame]	2318	setValue(&I, DAG.getNode(ISD::VECTOR_SHUFFLE, VT, Src1, Src2, Mask));
Mon P Wang	aeb06d2	2008-11-10 04:46:22 +0000	[diff] [blame]	2319	return;
				2320	}
				2321
				2322	// Normalize the shuffle vector since mask and vector length don't match.
Mon P Wang	c7849c2	2008-11-16 05:06:27 +0000	[diff] [blame]	2323	MVT MaskEltVT = Mask.getValueType().getVectorElementType();
				2324
				2325	if (SrcNumElts < MaskNumElts && MaskNumElts % SrcNumElts == 0) {
				2326	// Mask is longer than the source vectors and is a multiple of the source
				2327	// vectors. We can use concatenate vector to make the mask and vectors
Mon P Wang	230e4fa	2008-11-21 04:25:21 +0000	[diff] [blame]	2328	// lengths match.
Mon P Wang	c7849c2	2008-11-16 05:06:27 +0000	[diff] [blame]	2329	if (SrcNumElts*2 == MaskNumElts && SequentialMask(Mask, 0)) {
				2330	// The shuffle is concatenating two vectors together.
Mon P Wang	230e4fa	2008-11-21 04:25:21 +0000	[diff] [blame]	2331	setValue(&I, DAG.getNode(ISD::CONCAT_VECTORS, VT, Src1, Src2));
Mon P Wang	aeb06d2	2008-11-10 04:46:22 +0000	[diff] [blame]	2332	return;
				2333	}
				2334
Mon P Wang	c7849c2	2008-11-16 05:06:27 +0000	[diff] [blame]	2335	// Pad both vectors with undefs to make them the same length as the mask.
				2336	unsigned NumConcat = MaskNumElts / SrcNumElts;
				2337	SDValue UndefVal = DAG.getNode(ISD::UNDEF, SrcVT);
Mon P Wang	aeb06d2	2008-11-10 04:46:22 +0000	[diff] [blame]	2338
Mon P Wang	230e4fa	2008-11-21 04:25:21 +0000	[diff] [blame]	2339	SDValue* MOps1 = new SDValue[NumConcat];
				2340	SDValue* MOps2 = new SDValue[NumConcat];
				2341	MOps1[0] = Src1;
				2342	MOps2[0] = Src2;
Mon P Wang	aeb06d2	2008-11-10 04:46:22 +0000	[diff] [blame]	2343	for (unsigned i = 1; i != NumConcat; ++i) {
Mon P Wang	230e4fa	2008-11-21 04:25:21 +0000	[diff] [blame]	2344	MOps1[i] = UndefVal;
				2345	MOps2[i] = UndefVal;
Mon P Wang	aeb06d2	2008-11-10 04:46:22 +0000	[diff] [blame]	2346	}
Mon P Wang	230e4fa	2008-11-21 04:25:21 +0000	[diff] [blame]	2347	Src1 = DAG.getNode(ISD::CONCAT_VECTORS, VT, MOps1, NumConcat);
				2348	Src2 = DAG.getNode(ISD::CONCAT_VECTORS, VT, MOps2, NumConcat);
				2349
				2350	delete [] MOps1;
				2351	delete [] MOps2;
				2352
Mon P Wang	aeb06d2	2008-11-10 04:46:22 +0000	[diff] [blame]	2353	// Readjust mask for new input vector length.
				2354	SmallVector<SDValue, 8> MappedOps;
Mon P Wang	c7849c2	2008-11-16 05:06:27 +0000	[diff] [blame]	2355	for (int i = 0; i != MaskNumElts; ++i) {
Mon P Wang	aeb06d2	2008-11-10 04:46:22 +0000	[diff] [blame]	2356	if (Mask.getOperand(i).getOpcode() == ISD::UNDEF) {
				2357	MappedOps.push_back(Mask.getOperand(i));
				2358	} else {
Mon P Wang	c7849c2	2008-11-16 05:06:27 +0000	[diff] [blame]	2359	int Idx = cast<ConstantSDNode>(Mask.getOperand(i))->getZExtValue();
				2360	if (Idx < SrcNumElts)
				2361	MappedOps.push_back(DAG.getConstant(Idx, MaskEltVT));
				2362	else
				2363	MappedOps.push_back(DAG.getConstant(Idx + MaskNumElts - SrcNumElts,
				2364	MaskEltVT));
Mon P Wang	aeb06d2	2008-11-10 04:46:22 +0000	[diff] [blame]	2365	}
				2366	}
				2367	Mask = DAG.getNode(ISD::BUILD_VECTOR, Mask.getValueType(),
				2368	&MappedOps[0], MappedOps.size());
				2369
Mon P Wang	230e4fa	2008-11-21 04:25:21 +0000	[diff] [blame]	2370	setValue(&I, DAG.getNode(ISD::VECTOR_SHUFFLE, VT, Src1, Src2, Mask));
Mon P Wang	aeb06d2	2008-11-10 04:46:22 +0000	[diff] [blame]	2371	return;
				2372	}
				2373
Mon P Wang	c7849c2	2008-11-16 05:06:27 +0000	[diff] [blame]	2374	if (SrcNumElts > MaskNumElts) {
Mon P Wang	aeb06d2	2008-11-10 04:46:22 +0000	[diff] [blame]	2375	// Resulting vector is shorter than the incoming vector.
Mon P Wang	c7849c2	2008-11-16 05:06:27 +0000	[diff] [blame]	2376	if (SrcNumElts == MaskNumElts && SequentialMask(Mask,0)) {
Mon P Wang	aeb06d2	2008-11-10 04:46:22 +0000	[diff] [blame]	2377	// Shuffle extracts 1st vector.
Mon P Wang	230e4fa	2008-11-21 04:25:21 +0000	[diff] [blame]	2378	setValue(&I, Src1);
Mon P Wang	aeb06d2	2008-11-10 04:46:22 +0000	[diff] [blame]	2379	return;
				2380	}
				2381
Mon P Wang	c7849c2	2008-11-16 05:06:27 +0000	[diff] [blame]	2382	if (SrcNumElts == MaskNumElts && SequentialMask(Mask,MaskNumElts)) {
Mon P Wang	aeb06d2	2008-11-10 04:46:22 +0000	[diff] [blame]	2383	// Shuffle extracts 2nd vector.
Mon P Wang	230e4fa	2008-11-21 04:25:21 +0000	[diff] [blame]	2384	setValue(&I, Src2);
Mon P Wang	aeb06d2	2008-11-10 04:46:22 +0000	[diff] [blame]	2385	return;
				2386	}
				2387
Mon P Wang	c7849c2	2008-11-16 05:06:27 +0000	[diff] [blame]	2388	// Analyze the access pattern of the vector to see if we can extract
				2389	// two subvectors and do the shuffle. The analysis is done by calculating
				2390	// the range of elements the mask access on both vectors.
				2391	int MinRange[2] = { SrcNumElts+1, SrcNumElts+1};
				2392	int MaxRange[2] = {-1, -1};
				2393
				2394	for (int i = 0; i != MaskNumElts; ++i) {
Mon P Wang	aeb06d2	2008-11-10 04:46:22 +0000	[diff] [blame]	2395	SDValue Arg = Mask.getOperand(i);
				2396	if (Arg.getOpcode() != ISD::UNDEF) {
				2397	assert(isa<ConstantSDNode>(Arg) && "Invalid VECTOR_SHUFFLE mask!");
Mon P Wang	c7849c2	2008-11-16 05:06:27 +0000	[diff] [blame]	2398	int Idx = cast<ConstantSDNode>(Arg)->getZExtValue();
				2399	int Input = 0;
				2400	if (Idx >= SrcNumElts) {
				2401	Input = 1;
				2402	Idx -= SrcNumElts;
				2403	}
				2404	if (Idx > MaxRange[Input])
				2405	MaxRange[Input] = Idx;
				2406	if (Idx < MinRange[Input])
				2407	MinRange[Input] = Idx;
Mon P Wang	aeb06d2	2008-11-10 04:46:22 +0000	[diff] [blame]	2408	}
				2409	}
Mon P Wang	aeb06d2	2008-11-10 04:46:22 +0000	[diff] [blame]	2410
Mon P Wang	c7849c2	2008-11-16 05:06:27 +0000	[diff] [blame]	2411	// Check if the access is smaller than the vector size and can we find
				2412	// a reasonable extract index.
Mon P Wang	230e4fa	2008-11-21 04:25:21 +0000	[diff] [blame]	2413	int RangeUse[2] = { 2, 2 }; // 0 = Unused, 1 = Extract, 2 = Can not Extract.
Mon P Wang	c7849c2	2008-11-16 05:06:27 +0000	[diff] [blame]	2414	int StartIdx[2]; // StartIdx to extract from
				2415	for (int Input=0; Input < 2; ++Input) {
				2416	if (MinRange[Input] == SrcNumElts+1 && MaxRange[Input] == -1) {
				2417	RangeUse[Input] = 0; // Unused
				2418	StartIdx[Input] = 0;
				2419	} else if (MaxRange[Input] - MinRange[Input] < MaskNumElts) {
				2420	// Fits within range but we should see if we can find a good
Mon P Wang	230e4fa	2008-11-21 04:25:21 +0000	[diff] [blame]	2421	// start index that is a multiple of the mask length.
Mon P Wang	c7849c2	2008-11-16 05:06:27 +0000	[diff] [blame]	2422	if (MaxRange[Input] < MaskNumElts) {
				2423	RangeUse[Input] = 1; // Extract from beginning of the vector
				2424	StartIdx[Input] = 0;
				2425	} else {
				2426	StartIdx[Input] = (MinRange[Input]/MaskNumElts)*MaskNumElts;
Mon P Wang	6cce3da	2008-11-23 04:35:05 +0000	[diff] [blame]	2427	if (MaxRange[Input] - StartIdx[Input] < MaskNumElts &&
				2428	StartIdx[Input] + MaskNumElts < SrcNumElts)
Mon P Wang	c7849c2	2008-11-16 05:06:27 +0000	[diff] [blame]	2429	RangeUse[Input] = 1; // Extract from a multiple of the mask length.
Mon P Wang	c7849c2	2008-11-16 05:06:27 +0000	[diff] [blame]	2430	}
Mon P Wang	230e4fa	2008-11-21 04:25:21 +0000	[diff] [blame]	2431	}
Mon P Wang	c7849c2	2008-11-16 05:06:27 +0000	[diff] [blame]	2432	}
				2433
				2434	if (RangeUse[0] == 0 && RangeUse[0] == 0) {
				2435	setValue(&I, DAG.getNode(ISD::UNDEF, VT)); // Vectors are not used.
				2436	return;
				2437	}
				2438	else if (RangeUse[0] < 2 && RangeUse[1] < 2) {
				2439	// Extract appropriate subvector and generate a vector shuffle
				2440	for (int Input=0; Input < 2; ++Input) {
Mon P Wang	230e4fa	2008-11-21 04:25:21 +0000	[diff] [blame]	2441	SDValue& Src = Input == 0 ? Src1 : Src2;
Mon P Wang	c7849c2	2008-11-16 05:06:27 +0000	[diff] [blame]	2442	if (RangeUse[Input] == 0) {
Mon P Wang	230e4fa	2008-11-21 04:25:21 +0000	[diff] [blame]	2443	Src = DAG.getNode(ISD::UNDEF, VT);
Mon P Wang	c7849c2	2008-11-16 05:06:27 +0000	[diff] [blame]	2444	} else {
Mon P Wang	230e4fa	2008-11-21 04:25:21 +0000	[diff] [blame]	2445	Src = DAG.getNode(ISD::EXTRACT_SUBVECTOR, VT, Src,
				2446	DAG.getIntPtrConstant(StartIdx[Input]));
Mon P Wang	c7849c2	2008-11-16 05:06:27 +0000	[diff] [blame]	2447	}
Mon P Wang	aeb06d2	2008-11-10 04:46:22 +0000	[diff] [blame]	2448	}
Mon P Wang	c7849c2	2008-11-16 05:06:27 +0000	[diff] [blame]	2449	// Calculate new mask.
				2450	SmallVector<SDValue, 8> MappedOps;
				2451	for (int i = 0; i != MaskNumElts; ++i) {
				2452	SDValue Arg = Mask.getOperand(i);
				2453	if (Arg.getOpcode() == ISD::UNDEF) {
				2454	MappedOps.push_back(Arg);
				2455	} else {
				2456	int Idx = cast<ConstantSDNode>(Arg)->getZExtValue();
				2457	if (Idx < SrcNumElts)
				2458	MappedOps.push_back(DAG.getConstant(Idx - StartIdx[0], MaskEltVT));
				2459	else {
				2460	Idx = Idx - SrcNumElts - StartIdx[1] + MaskNumElts;
				2461	MappedOps.push_back(DAG.getConstant(Idx, MaskEltVT));
				2462	}
				2463	}
				2464	}
				2465	Mask = DAG.getNode(ISD::BUILD_VECTOR, Mask.getValueType(),
				2466	&MappedOps[0], MappedOps.size());
Mon P Wang	230e4fa	2008-11-21 04:25:21 +0000	[diff] [blame]	2467	setValue(&I, DAG.getNode(ISD::VECTOR_SHUFFLE, VT, Src1, Src2, Mask));
Mon P Wang	c7849c2	2008-11-16 05:06:27 +0000	[diff] [blame]	2468	return;
Mon P Wang	aeb06d2	2008-11-10 04:46:22 +0000	[diff] [blame]	2469	}
				2470	}
				2471
Mon P Wang	c7849c2	2008-11-16 05:06:27 +0000	[diff] [blame]	2472	// We can't use either concat vectors or extract subvectors so fall back to
				2473	// replacing the shuffle with extract and build vector.
				2474	// to insert and build vector.
Mon P Wang	aeb06d2	2008-11-10 04:46:22 +0000	[diff] [blame]	2475	MVT EltVT = VT.getVectorElementType();
				2476	MVT PtrVT = TLI.getPointerTy();
				2477	SmallVector<SDValue,8> Ops;
Mon P Wang	c7849c2	2008-11-16 05:06:27 +0000	[diff] [blame]	2478	for (int i = 0; i != MaskNumElts; ++i) {
Mon P Wang	aeb06d2	2008-11-10 04:46:22 +0000	[diff] [blame]	2479	SDValue Arg = Mask.getOperand(i);
				2480	if (Arg.getOpcode() == ISD::UNDEF) {
				2481	Ops.push_back(DAG.getNode(ISD::UNDEF, EltVT));
				2482	} else {
				2483	assert(isa<ConstantSDNode>(Arg) && "Invalid VECTOR_SHUFFLE mask!");
Mon P Wang	c7849c2	2008-11-16 05:06:27 +0000	[diff] [blame]	2484	int Idx = cast<ConstantSDNode>(Arg)->getZExtValue();
				2485	if (Idx < SrcNumElts)
Mon P Wang	230e4fa	2008-11-21 04:25:21 +0000	[diff] [blame]	2486	Ops.push_back(DAG.getNode(ISD::EXTRACT_VECTOR_ELT, EltVT, Src1,
Mon P Wang	aeb06d2	2008-11-10 04:46:22 +0000	[diff] [blame]	2487	DAG.getConstant(Idx, PtrVT)));
				2488	else
Mon P Wang	230e4fa	2008-11-21 04:25:21 +0000	[diff] [blame]	2489	Ops.push_back(DAG.getNode(ISD::EXTRACT_VECTOR_ELT, EltVT, Src2,
Mon P Wang	c7849c2	2008-11-16 05:06:27 +0000	[diff] [blame]	2490	DAG.getConstant(Idx - SrcNumElts, PtrVT)));
Mon P Wang	aeb06d2	2008-11-10 04:46:22 +0000	[diff] [blame]	2491	}
				2492	}
				2493	setValue(&I, DAG.getNode(ISD::BUILD_VECTOR, VT, &Ops[0], Ops.size()));
Dan Gohman	f0cbcd4	2008-09-03 16:12:24 +0000	[diff] [blame]	2494	}
				2495
				2496	void SelectionDAGLowering::visitInsertValue(InsertValueInst &I) {
				2497	const Value *Op0 = I.getOperand(0);
				2498	const Value *Op1 = I.getOperand(1);
				2499	const Type *AggTy = I.getType();
				2500	const Type *ValTy = Op1->getType();
				2501	bool IntoUndef = isa<UndefValue>(Op0);
				2502	bool FromUndef = isa<UndefValue>(Op1);
				2503
				2504	unsigned LinearIndex = ComputeLinearIndex(TLI, AggTy,
				2505	I.idx_begin(), I.idx_end());
				2506
				2507	SmallVector<MVT, 4> AggValueVTs;
				2508	ComputeValueVTs(TLI, AggTy, AggValueVTs);
				2509	SmallVector<MVT, 4> ValValueVTs;
				2510	ComputeValueVTs(TLI, ValTy, ValValueVTs);
				2511
				2512	unsigned NumAggValues = AggValueVTs.size();
				2513	unsigned NumValValues = ValValueVTs.size();
				2514	SmallVector<SDValue, 4> Values(NumAggValues);
				2515
				2516	SDValue Agg = getValue(Op0);
				2517	SDValue Val = getValue(Op1);
				2518	unsigned i = 0;
				2519	// Copy the beginning value(s) from the original aggregate.
				2520	for (; i != LinearIndex; ++i)
				2521	Values[i] = IntoUndef ? DAG.getNode(ISD::UNDEF, AggValueVTs[i]) :
				2522	SDValue(Agg.getNode(), Agg.getResNo() + i);
				2523	// Copy values from the inserted value(s).
				2524	for (; i != LinearIndex + NumValValues; ++i)
				2525	Values[i] = FromUndef ? DAG.getNode(ISD::UNDEF, AggValueVTs[i]) :
				2526	SDValue(Val.getNode(), Val.getResNo() + i - LinearIndex);
				2527	// Copy remaining value(s) from the original aggregate.
				2528	for (; i != NumAggValues; ++i)
				2529	Values[i] = IntoUndef ? DAG.getNode(ISD::UNDEF, AggValueVTs[i]) :
				2530	SDValue(Agg.getNode(), Agg.getResNo() + i);
				2531
Duncan Sands	aaffa05	2008-12-01 11:41:29 +0000	[diff] [blame]	2532	setValue(&I, DAG.getNode(ISD::MERGE_VALUES,
				2533	DAG.getVTList(&AggValueVTs[0], NumAggValues),
				2534	&Values[0], NumAggValues));
Dan Gohman	f0cbcd4	2008-09-03 16:12:24 +0000	[diff] [blame]	2535	}
				2536
				2537	void SelectionDAGLowering::visitExtractValue(ExtractValueInst &I) {
				2538	const Value *Op0 = I.getOperand(0);
				2539	const Type *AggTy = Op0->getType();
				2540	const Type *ValTy = I.getType();
				2541	bool OutOfUndef = isa<UndefValue>(Op0);
				2542
				2543	unsigned LinearIndex = ComputeLinearIndex(TLI, AggTy,
				2544	I.idx_begin(), I.idx_end());
				2545
				2546	SmallVector<MVT, 4> ValValueVTs;
				2547	ComputeValueVTs(TLI, ValTy, ValValueVTs);
				2548
				2549	unsigned NumValValues = ValValueVTs.size();
				2550	SmallVector<SDValue, 4> Values(NumValValues);
				2551
				2552	SDValue Agg = getValue(Op0);
				2553	// Copy out the selected value(s).
				2554	for (unsigned i = LinearIndex; i != LinearIndex + NumValValues; ++i)
				2555	Values[i - LinearIndex] =
Bill Wendling	f0a2d0c	2008-11-20 07:24:30 +0000	[diff] [blame]	2556	OutOfUndef ?
				2557	DAG.getNode(ISD::UNDEF,
				2558	Agg.getNode()->getValueType(Agg.getResNo() + i)) :
				2559	SDValue(Agg.getNode(), Agg.getResNo() + i);
Dan Gohman	f0cbcd4	2008-09-03 16:12:24 +0000	[diff] [blame]	2560
Duncan Sands	aaffa05	2008-12-01 11:41:29 +0000	[diff] [blame]	2561	setValue(&I, DAG.getNode(ISD::MERGE_VALUES,
				2562	DAG.getVTList(&ValValueVTs[0], NumValValues),
				2563	&Values[0], NumValValues));
Dan Gohman	f0cbcd4	2008-09-03 16:12:24 +0000	[diff] [blame]	2564	}
				2565
				2566
				2567	void SelectionDAGLowering::visitGetElementPtr(User &I) {
				2568	SDValue N = getValue(I.getOperand(0));
				2569	const Type *Ty = I.getOperand(0)->getType();
				2570
				2571	for (GetElementPtrInst::op_iterator OI = I.op_begin()+1, E = I.op_end();
				2572	OI != E; ++OI) {
				2573	Value Idx = OI;
				2574	if (const StructType *StTy = dyn_cast<StructType>(Ty)) {
				2575	unsigned Field = cast<ConstantInt>(Idx)->getZExtValue();
				2576	if (Field) {
				2577	// N = N + Offset
				2578	uint64_t Offset = TD->getStructLayout(StTy)->getElementOffset(Field);
				2579	N = DAG.getNode(ISD::ADD, N.getValueType(), N,
				2580	DAG.getIntPtrConstant(Offset));
				2581	}
				2582	Ty = StTy->getElementType(Field);
				2583	} else {
				2584	Ty = cast<SequentialType>(Ty)->getElementType();
				2585
				2586	// If this is a constant subscript, handle it quickly.
				2587	if (ConstantInt *CI = dyn_cast<ConstantInt>(Idx)) {
				2588	if (CI->getZExtValue() == 0) continue;
				2589	uint64_t Offs =
				2590	TD->getABITypeSize(Ty)*cast<ConstantInt>(CI)->getSExtValue();
				2591	N = DAG.getNode(ISD::ADD, N.getValueType(), N,
				2592	DAG.getIntPtrConstant(Offs));
				2593	continue;
				2594	}
				2595
				2596	// N = N + Idx * ElementSize;
				2597	uint64_t ElementSize = TD->getABITypeSize(Ty);
				2598	SDValue IdxN = getValue(Idx);
				2599
				2600	// If the index is smaller or larger than intptr_t, truncate or extend
				2601	// it.
				2602	if (IdxN.getValueType().bitsLT(N.getValueType()))
				2603	IdxN = DAG.getNode(ISD::SIGN_EXTEND, N.getValueType(), IdxN);
				2604	else if (IdxN.getValueType().bitsGT(N.getValueType()))
				2605	IdxN = DAG.getNode(ISD::TRUNCATE, N.getValueType(), IdxN);
				2606
				2607	// If this is a multiply by a power of two, turn it into a shl
				2608	// immediately. This is a very common case.
				2609	if (ElementSize != 1) {
				2610	if (isPowerOf2_64(ElementSize)) {
				2611	unsigned Amt = Log2_64(ElementSize);
				2612	IdxN = DAG.getNode(ISD::SHL, N.getValueType(), IdxN,
				2613	DAG.getConstant(Amt, TLI.getShiftAmountTy()));
				2614	} else {
				2615	SDValue Scale = DAG.getIntPtrConstant(ElementSize);
				2616	IdxN = DAG.getNode(ISD::MUL, N.getValueType(), IdxN, Scale);
				2617	}
				2618	}
				2619
				2620	N = DAG.getNode(ISD::ADD, N.getValueType(), N, IdxN);
				2621	}
				2622	}
				2623	setValue(&I, N);
				2624	}
				2625
				2626	void SelectionDAGLowering::visitAlloca(AllocaInst &I) {
				2627	// If this is a fixed sized alloca in the entry block of the function,
				2628	// allocate it statically on the stack.
				2629	if (FuncInfo.StaticAllocaMap.count(&I))
				2630	return; // getValue will auto-populate this.
				2631
				2632	const Type *Ty = I.getAllocatedType();
				2633	uint64_t TySize = TLI.getTargetData()->getABITypeSize(Ty);
				2634	unsigned Align =
				2635	std::max((unsigned)TLI.getTargetData()->getPrefTypeAlignment(Ty),
				2636	I.getAlignment());
				2637
				2638	SDValue AllocSize = getValue(I.getArraySize());
				2639	MVT IntPtr = TLI.getPointerTy();
				2640	if (IntPtr.bitsLT(AllocSize.getValueType()))
				2641	AllocSize = DAG.getNode(ISD::TRUNCATE, IntPtr, AllocSize);
				2642	else if (IntPtr.bitsGT(AllocSize.getValueType()))
				2643	AllocSize = DAG.getNode(ISD::ZERO_EXTEND, IntPtr, AllocSize);
				2644
				2645	AllocSize = DAG.getNode(ISD::MUL, IntPtr, AllocSize,
				2646	DAG.getIntPtrConstant(TySize));
				2647
				2648	// Handle alignment. If the requested alignment is less than or equal to
				2649	// the stack alignment, ignore it. If the size is greater than or equal to
				2650	// the stack alignment, we note this in the DYNAMIC_STACKALLOC node.
				2651	unsigned StackAlign =
				2652	TLI.getTargetMachine().getFrameInfo()->getStackAlignment();
				2653	if (Align <= StackAlign)
				2654	Align = 0;
				2655
				2656	// Round the size of the allocation up to the stack alignment size
				2657	// by add SA-1 to the size.
				2658	AllocSize = DAG.getNode(ISD::ADD, AllocSize.getValueType(), AllocSize,
				2659	DAG.getIntPtrConstant(StackAlign-1));
				2660	// Mask out the low bits for alignment purposes.
				2661	AllocSize = DAG.getNode(ISD::AND, AllocSize.getValueType(), AllocSize,
				2662	DAG.getIntPtrConstant(~(uint64_t)(StackAlign-1)));
				2663
				2664	SDValue Ops[] = { getRoot(), AllocSize, DAG.getIntPtrConstant(Align) };
				2665	const MVT *VTs = DAG.getNodeValueTypes(AllocSize.getValueType(),
				2666	MVT::Other);
				2667	SDValue DSA = DAG.getNode(ISD::DYNAMIC_STACKALLOC, VTs, 2, Ops, 3);
				2668	setValue(&I, DSA);
				2669	DAG.setRoot(DSA.getValue(1));
				2670
				2671	// Inform the Frame Information that we have just allocated a variable-sized
				2672	// object.
				2673	CurMBB->getParent()->getFrameInfo()->CreateVariableSizedObject();
				2674	}
				2675
				2676	void SelectionDAGLowering::visitLoad(LoadInst &I) {
				2677	const Value *SV = I.getOperand(0);
				2678	SDValue Ptr = getValue(SV);
				2679
				2680	const Type *Ty = I.getType();
				2681	bool isVolatile = I.isVolatile();
				2682	unsigned Alignment = I.getAlignment();
				2683
				2684	SmallVector<MVT, 4> ValueVTs;
				2685	SmallVector<uint64_t, 4> Offsets;
				2686	ComputeValueVTs(TLI, Ty, ValueVTs, &Offsets);
				2687	unsigned NumValues = ValueVTs.size();
				2688	if (NumValues == 0)
				2689	return;
				2690
				2691	SDValue Root;
				2692	bool ConstantMemory = false;
				2693	if (I.isVolatile())
				2694	// Serialize volatile loads with other side effects.
				2695	Root = getRoot();
				2696	else if (AA->pointsToConstantMemory(SV)) {
				2697	// Do not serialize (non-volatile) loads of constant memory with anything.
				2698	Root = DAG.getEntryNode();
				2699	ConstantMemory = true;
				2700	} else {
				2701	// Do not serialize non-volatile loads against each other.
				2702	Root = DAG.getRoot();
				2703	}
				2704
				2705	SmallVector<SDValue, 4> Values(NumValues);
				2706	SmallVector<SDValue, 4> Chains(NumValues);
				2707	MVT PtrVT = Ptr.getValueType();
				2708	for (unsigned i = 0; i != NumValues; ++i) {
				2709	SDValue L = DAG.getLoad(ValueVTs[i], Root,
				2710	DAG.getNode(ISD::ADD, PtrVT, Ptr,
				2711	DAG.getConstant(Offsets[i], PtrVT)),
				2712	SV, Offsets[i],
				2713	isVolatile, Alignment);
				2714	Values[i] = L;
				2715	Chains[i] = L.getValue(1);
				2716	}
				2717
				2718	if (!ConstantMemory) {
				2719	SDValue Chain = DAG.getNode(ISD::TokenFactor, MVT::Other,
				2720	&Chains[0], NumValues);
				2721	if (isVolatile)
				2722	DAG.setRoot(Chain);
				2723	else
				2724	PendingLoads.push_back(Chain);
				2725	}
				2726
Duncan Sands	aaffa05	2008-12-01 11:41:29 +0000	[diff] [blame]	2727	setValue(&I, DAG.getNode(ISD::MERGE_VALUES,
				2728	DAG.getVTList(&ValueVTs[0], NumValues),
				2729	&Values[0], NumValues));
Dan Gohman	f0cbcd4	2008-09-03 16:12:24 +0000	[diff] [blame]	2730	}
				2731
				2732
				2733	void SelectionDAGLowering::visitStore(StoreInst &I) {
				2734	Value *SrcV = I.getOperand(0);
				2735	Value *PtrV = I.getOperand(1);
				2736
				2737	SmallVector<MVT, 4> ValueVTs;
				2738	SmallVector<uint64_t, 4> Offsets;
				2739	ComputeValueVTs(TLI, SrcV->getType(), ValueVTs, &Offsets);
				2740	unsigned NumValues = ValueVTs.size();
				2741	if (NumValues == 0)
				2742	return;
				2743
				2744	// Get the lowered operands. Note that we do this after
				2745	// checking if NumResults is zero, because with zero results
				2746	// the operands won't have values in the map.
				2747	SDValue Src = getValue(SrcV);
				2748	SDValue Ptr = getValue(PtrV);
				2749
				2750	SDValue Root = getRoot();
				2751	SmallVector<SDValue, 4> Chains(NumValues);
				2752	MVT PtrVT = Ptr.getValueType();
				2753	bool isVolatile = I.isVolatile();
				2754	unsigned Alignment = I.getAlignment();
				2755	for (unsigned i = 0; i != NumValues; ++i)
				2756	Chains[i] = DAG.getStore(Root, SDValue(Src.getNode(), Src.getResNo() + i),
				2757	DAG.getNode(ISD::ADD, PtrVT, Ptr,
				2758	DAG.getConstant(Offsets[i], PtrVT)),
				2759	PtrV, Offsets[i],
				2760	isVolatile, Alignment);
				2761
				2762	DAG.setRoot(DAG.getNode(ISD::TokenFactor, MVT::Other, &Chains[0], NumValues));
				2763	}
				2764
				2765	/// visitTargetIntrinsic - Lower a call of a target intrinsic to an INTRINSIC
				2766	/// node.
				2767	void SelectionDAGLowering::visitTargetIntrinsic(CallInst &I,
				2768	unsigned Intrinsic) {
				2769	bool HasChain = !I.doesNotAccessMemory();
				2770	bool OnlyLoad = HasChain && I.onlyReadsMemory();
				2771
				2772	// Build the operand list.
				2773	SmallVector<SDValue, 8> Ops;
				2774	if (HasChain) { // If this intrinsic has side-effects, chainify it.
				2775	if (OnlyLoad) {
				2776	// We don't need to serialize loads against other loads.
				2777	Ops.push_back(DAG.getRoot());
				2778	} else {
				2779	Ops.push_back(getRoot());
				2780	}
				2781	}
Mon P Wang	3efcd4a	2008-11-01 20:24:53 +0000	[diff] [blame]	2782
				2783	// Info is set by getTgtMemInstrinsic
				2784	TargetLowering::IntrinsicInfo Info;
				2785	bool IsTgtIntrinsic = TLI.getTgtMemIntrinsic(Info, I, Intrinsic);
				2786
				2787	// Add the intrinsic ID as an integer operand if it's not a target intrinsic.
				2788	if (!IsTgtIntrinsic)
				2789	Ops.push_back(DAG.getConstant(Intrinsic, TLI.getPointerTy()));
Dan Gohman	f0cbcd4	2008-09-03 16:12:24 +0000	[diff] [blame]	2790
				2791	// Add all operands of the call to the operand list.
				2792	for (unsigned i = 1, e = I.getNumOperands(); i != e; ++i) {
				2793	SDValue Op = getValue(I.getOperand(i));
				2794	assert(TLI.isTypeLegal(Op.getValueType()) &&
				2795	"Intrinsic uses a non-legal type?");
				2796	Ops.push_back(Op);
				2797	}
				2798
				2799	std::vector<MVT> VTs;
				2800	if (I.getType() != Type::VoidTy) {
				2801	MVT VT = TLI.getValueType(I.getType());
				2802	if (VT.isVector()) {
				2803	const VectorType *DestTy = cast<VectorType>(I.getType());
				2804	MVT EltVT = TLI.getValueType(DestTy->getElementType());
				2805
				2806	VT = MVT::getVectorVT(EltVT, DestTy->getNumElements());
				2807	assert(VT != MVT::Other && "Intrinsic uses a non-legal type?");
				2808	}
				2809
				2810	assert(TLI.isTypeLegal(VT) && "Intrinsic uses a non-legal type?");
				2811	VTs.push_back(VT);
				2812	}
				2813	if (HasChain)
				2814	VTs.push_back(MVT::Other);
				2815
				2816	const MVT *VTList = DAG.getNodeValueTypes(VTs);
				2817
				2818	// Create the node.
				2819	SDValue Result;
Mon P Wang	3efcd4a	2008-11-01 20:24:53 +0000	[diff] [blame]	2820	if (IsTgtIntrinsic) {
				2821	// This is target intrinsic that touches memory
				2822	Result = DAG.getMemIntrinsicNode(Info.opc, VTList, VTs.size(),
				2823	&Ops[0], Ops.size(),
				2824	Info.memVT, Info.ptrVal, Info.offset,
				2825	Info.align, Info.vol,
				2826	Info.readMem, Info.writeMem);
				2827	}
				2828	else if (!HasChain)
Dan Gohman	f0cbcd4	2008-09-03 16:12:24 +0000	[diff] [blame]	2829	Result = DAG.getNode(ISD::INTRINSIC_WO_CHAIN, VTList, VTs.size(),
				2830	&Ops[0], Ops.size());
				2831	else if (I.getType() != Type::VoidTy)
				2832	Result = DAG.getNode(ISD::INTRINSIC_W_CHAIN, VTList, VTs.size(),
				2833	&Ops[0], Ops.size());
				2834	else
				2835	Result = DAG.getNode(ISD::INTRINSIC_VOID, VTList, VTs.size(),
				2836	&Ops[0], Ops.size());
				2837
				2838	if (HasChain) {
				2839	SDValue Chain = Result.getValue(Result.getNode()->getNumValues()-1);
				2840	if (OnlyLoad)
				2841	PendingLoads.push_back(Chain);
				2842	else
				2843	DAG.setRoot(Chain);
				2844	}
				2845	if (I.getType() != Type::VoidTy) {
				2846	if (const VectorType *PTy = dyn_cast<VectorType>(I.getType())) {
				2847	MVT VT = TLI.getValueType(PTy);
				2848	Result = DAG.getNode(ISD::BIT_CONVERT, VT, Result);
				2849	}
				2850	setValue(&I, Result);
				2851	}
				2852	}
				2853
				2854	/// ExtractTypeInfo - Returns the type info, possibly bitcast, encoded in V.
				2855	static GlobalVariable ExtractTypeInfo(Value V) {
				2856	V = V->stripPointerCasts();
				2857	GlobalVariable *GV = dyn_cast<GlobalVariable>(V);
				2858	assert ((GV \|\| isa<ConstantPointerNull>(V)) &&
				2859	"TypeInfo must be a global variable or NULL");
				2860	return GV;
				2861	}
				2862
				2863	namespace llvm {
				2864
				2865	/// AddCatchInfo - Extract the personality and type infos from an eh.selector
				2866	/// call, and add them to the specified machine basic block.
				2867	void AddCatchInfo(CallInst &I, MachineModuleInfo *MMI,
				2868	MachineBasicBlock *MBB) {
				2869	// Inform the MachineModuleInfo of the personality for this landing pad.
				2870	ConstantExpr *CE = cast<ConstantExpr>(I.getOperand(2));
				2871	assert(CE->getOpcode() == Instruction::BitCast &&
				2872	isa<Function>(CE->getOperand(0)) &&
				2873	"Personality should be a function");
				2874	MMI->addPersonality(MBB, cast<Function>(CE->getOperand(0)));
				2875
				2876	// Gather all the type infos for this landing pad and pass them along to
				2877	// MachineModuleInfo.
				2878	std::vector<GlobalVariable *> TyInfo;
				2879	unsigned N = I.getNumOperands();
				2880
				2881	for (unsigned i = N - 1; i > 2; --i) {
				2882	if (ConstantInt *CI = dyn_cast<ConstantInt>(I.getOperand(i))) {
				2883	unsigned FilterLength = CI->getZExtValue();
				2884	unsigned FirstCatch = i + FilterLength + !FilterLength;
				2885	assert (FirstCatch <= N && "Invalid filter length");
				2886
				2887	if (FirstCatch < N) {
				2888	TyInfo.reserve(N - FirstCatch);
				2889	for (unsigned j = FirstCatch; j < N; ++j)
				2890	TyInfo.push_back(ExtractTypeInfo(I.getOperand(j)));
				2891	MMI->addCatchTypeInfo(MBB, TyInfo);
				2892	TyInfo.clear();
				2893	}
				2894
				2895	if (!FilterLength) {
				2896	// Cleanup.
				2897	MMI->addCleanup(MBB);
				2898	} else {
				2899	// Filter.
				2900	TyInfo.reserve(FilterLength - 1);
				2901	for (unsigned j = i + 1; j < FirstCatch; ++j)
				2902	TyInfo.push_back(ExtractTypeInfo(I.getOperand(j)));
				2903	MMI->addFilterTypeInfo(MBB, TyInfo);
				2904	TyInfo.clear();
				2905	}
				2906
				2907	N = i;
				2908	}
				2909	}
				2910
				2911	if (N > 3) {
				2912	TyInfo.reserve(N - 3);
				2913	for (unsigned j = 3; j < N; ++j)
				2914	TyInfo.push_back(ExtractTypeInfo(I.getOperand(j)));
				2915	MMI->addCatchTypeInfo(MBB, TyInfo);
				2916	}
				2917	}
				2918
				2919	}
				2920
Bill Wendling	cd4c73a	2008-09-22 00:44:35 +0000	[diff] [blame]	2921	/// GetSignificand - Get the significand and build it into a floating-point
				2922	/// number with exponent of 1:
				2923	///
				2924	/// Op = (Op & 0x007fffff) \| 0x3f800000;
				2925	///
				2926	/// where Op is the hexidecimal representation of floating point value.
Bill Wendling	3915025	2008-09-09 20:39:27 +0000	[diff] [blame]	2927	static SDValue
				2928	GetSignificand(SelectionDAG &DAG, SDValue Op) {
				2929	SDValue t1 = DAG.getNode(ISD::AND, MVT::i32, Op,
				2930	DAG.getConstant(0x007fffff, MVT::i32));
				2931	SDValue t2 = DAG.getNode(ISD::OR, MVT::i32, t1,
				2932	DAG.getConstant(0x3f800000, MVT::i32));
				2933	return DAG.getNode(ISD::BIT_CONVERT, MVT::f32, t2);
				2934	}
				2935
Bill Wendling	cd4c73a	2008-09-22 00:44:35 +0000	[diff] [blame]	2936	/// GetExponent - Get the exponent:
				2937	///
				2938	/// (float)((Op1 >> 23) - 127);
				2939	///
				2940	/// where Op is the hexidecimal representation of floating point value.
Bill Wendling	3915025	2008-09-09 20:39:27 +0000	[diff] [blame]	2941	static SDValue
				2942	GetExponent(SelectionDAG &DAG, SDValue Op) {
Bill Wendling	fc2508e	2008-09-10 06:26:10 +0000	[diff] [blame]	2943	SDValue t1 = DAG.getNode(ISD::SRL, MVT::i32, Op,
Bill Wendling	3915025	2008-09-09 20:39:27 +0000	[diff] [blame]	2944	DAG.getConstant(23, MVT::i32));
Bill Wendling	fc2508e	2008-09-10 06:26:10 +0000	[diff] [blame]	2945	SDValue t2 = DAG.getNode(ISD::SUB, MVT::i32, t1,
Bill Wendling	3915025	2008-09-09 20:39:27 +0000	[diff] [blame]	2946	DAG.getConstant(127, MVT::i32));
Bill Wendling	fc2508e	2008-09-10 06:26:10 +0000	[diff] [blame]	2947	return DAG.getNode(ISD::UINT_TO_FP, MVT::f32, t2);
Bill Wendling	3915025	2008-09-09 20:39:27 +0000	[diff] [blame]	2948	}
				2949
Bill Wendling	cd4c73a	2008-09-22 00:44:35 +0000	[diff] [blame]	2950	/// getF32Constant - Get 32-bit floating point constant.
				2951	static SDValue
				2952	getF32Constant(SelectionDAG &DAG, unsigned Flt) {
				2953	return DAG.getConstantFP(APFloat(APInt(32, Flt)), MVT::f32);
				2954	}
				2955
Dan Gohman	f0cbcd4	2008-09-03 16:12:24 +0000	[diff] [blame]	2956	/// Inlined utility function to implement binary input atomic intrinsics for
				2957	/// visitIntrinsicCall: I is a call instruction
				2958	/// Op is the associated NodeType for I
				2959	const char *
				2960	SelectionDAGLowering::implVisitBinaryAtomic(CallInst& I, ISD::NodeType Op) {
				2961	SDValue Root = getRoot();
				2962	SDValue L = DAG.getAtomic(Op, Root,
Bill Wendling	2ce4e5c	2008-12-10 00:28:22 +0000	[diff] [blame]	2963	getValue(I.getOperand(1)),
				2964	getValue(I.getOperand(2)),
				2965	I.getOperand(1));
Dan Gohman	f0cbcd4	2008-09-03 16:12:24 +0000	[diff] [blame]	2966	setValue(&I, L);
				2967	DAG.setRoot(L.getValue(1));
				2968	return 0;
				2969	}
				2970
Bill Wendling	2ce4e5c	2008-12-10 00:28:22 +0000	[diff] [blame]	2971	// implVisitAluOverflow - Lower arithmetic overflow instrinsics.
Bill Wendling	74c3765	2008-12-09 22:08:41 +0000	[diff] [blame]	2972	const char *
				2973	SelectionDAGLowering::implVisitAluOverflow(CallInst &I, ISD::NodeType Op) {
Bill Wendling	2ce4e5c	2008-12-10 00:28:22 +0000	[diff] [blame]	2974	SDValue Op1 = getValue(I.getOperand(1));
				2975	SDValue Op2 = getValue(I.getOperand(2));
Bill Wendling	74c3765	2008-12-09 22:08:41 +0000	[diff] [blame]	2976
Bill Wendling	2ce4e5c	2008-12-10 00:28:22 +0000	[diff] [blame]	2977	MVT ValueVTs[] = { Op1.getValueType(), MVT::i1 };
				2978	SDValue Ops[] = { Op1, Op2 };
Bill Wendling	74c3765	2008-12-09 22:08:41 +0000	[diff] [blame]	2979
Bill Wendling	2ce4e5c	2008-12-10 00:28:22 +0000	[diff] [blame]	2980	SDValue Result = DAG.getNode(Op, DAG.getVTList(&ValueVTs[0], 2), &Ops[0], 2);
Bill Wendling	74c3765	2008-12-09 22:08:41 +0000	[diff] [blame]	2981
Bill Wendling	2ce4e5c	2008-12-10 00:28:22 +0000	[diff] [blame]	2982	setValue(&I, Result);
				2983	return 0;
				2984	}
Bill Wendling	74c3765	2008-12-09 22:08:41 +0000	[diff] [blame]	2985
Bill Wendling	b4ec283	2008-09-09 22:13:54 +0000	[diff] [blame]	2986	/// visitExp - Lower an exp intrinsic. Handles the special sequences for
				2987	/// limited-precision mode.
Dale Johannesen	59e577f	2008-09-05 18:38:42 +0000	[diff] [blame]	2988	void
				2989	SelectionDAGLowering::visitExp(CallInst &I) {
				2990	SDValue result;
Bill Wendling	b4ec283	2008-09-09 22:13:54 +0000	[diff] [blame]	2991
				2992	if (getValue(I.getOperand(1)).getValueType() == MVT::f32 &&
				2993	LimitFloatPrecision > 0 && LimitFloatPrecision <= 18) {
				2994	SDValue Op = getValue(I.getOperand(1));
				2995
				2996	// Put the exponent in the right bit position for later addition to the
				2997	// final result:
				2998	//
				2999	// #define LOG2OFe 1.4426950f
				3000	// IntegerPartOfX = ((int32_t)(X * LOG2OFe));
				3001	SDValue t0 = DAG.getNode(ISD::FMUL, MVT::f32, Op,
Bill Wendling	cd4c73a	2008-09-22 00:44:35 +0000	[diff] [blame]	3002	getF32Constant(DAG, 0x3fb8aa3b));
Bill Wendling	b4ec283	2008-09-09 22:13:54 +0000	[diff] [blame]	3003	SDValue IntegerPartOfX = DAG.getNode(ISD::FP_TO_SINT, MVT::i32, t0);
				3004
				3005	// FractionalPartOfX = (X * LOG2OFe) - (float)IntegerPartOfX;
				3006	SDValue t1 = DAG.getNode(ISD::SINT_TO_FP, MVT::f32, IntegerPartOfX);
				3007	SDValue X = DAG.getNode(ISD::FSUB, MVT::f32, t0, t1);
				3008
				3009	// IntegerPartOfX <<= 23;
				3010	IntegerPartOfX = DAG.getNode(ISD::SHL, MVT::i32, IntegerPartOfX,
				3011	DAG.getConstant(23, MVT::i32));
				3012
				3013	if (LimitFloatPrecision <= 6) {
				3014	// For floating-point precision of 6:
				3015	//
				3016	// TwoToFractionalPartOfX =
				3017	// 0.997535578f +
				3018	// (0.735607626f + 0.252464424f * x) * x;
				3019	//
				3020	// error 0.0144103317, which is 6 bits
				3021	SDValue t2 = DAG.getNode(ISD::FMUL, MVT::f32, X,
Bill Wendling	cd4c73a	2008-09-22 00:44:35 +0000	[diff] [blame]	3022	getF32Constant(DAG, 0x3e814304));
Bill Wendling	b4ec283	2008-09-09 22:13:54 +0000	[diff] [blame]	3023	SDValue t3 = DAG.getNode(ISD::FADD, MVT::f32, t2,
Bill Wendling	cd4c73a	2008-09-22 00:44:35 +0000	[diff] [blame]	3024	getF32Constant(DAG, 0x3f3c50c8));
Bill Wendling	b4ec283	2008-09-09 22:13:54 +0000	[diff] [blame]	3025	SDValue t4 = DAG.getNode(ISD::FMUL, MVT::f32, t3, X);
				3026	SDValue t5 = DAG.getNode(ISD::FADD, MVT::f32, t4,
Bill Wendling	cd4c73a	2008-09-22 00:44:35 +0000	[diff] [blame]	3027	getF32Constant(DAG, 0x3f7f5e7e));
Bill Wendling	b4ec283	2008-09-09 22:13:54 +0000	[diff] [blame]	3028	SDValue TwoToFracPartOfX = DAG.getNode(ISD::BIT_CONVERT, MVT::i32, t5);
				3029
				3030	// Add the exponent into the result in integer domain.
				3031	SDValue t6 = DAG.getNode(ISD::ADD, MVT::i32,
				3032	TwoToFracPartOfX, IntegerPartOfX);
				3033
				3034	result = DAG.getNode(ISD::BIT_CONVERT, MVT::f32, t6);
				3035	} else if (LimitFloatPrecision > 6 && LimitFloatPrecision <= 12) {
				3036	// For floating-point precision of 12:
				3037	//
				3038	// TwoToFractionalPartOfX =
				3039	// 0.999892986f +
				3040	// (0.696457318f +
				3041	// (0.224338339f + 0.792043434e-1f * x) * x) * x;
				3042	//
				3043	// 0.000107046256 error, which is 13 to 14 bits
				3044	SDValue t2 = DAG.getNode(ISD::FMUL, MVT::f32, X,
Bill Wendling	cd4c73a	2008-09-22 00:44:35 +0000	[diff] [blame]	3045	getF32Constant(DAG, 0x3da235e3));
Bill Wendling	b4ec283	2008-09-09 22:13:54 +0000	[diff] [blame]	3046	SDValue t3 = DAG.getNode(ISD::FADD, MVT::f32, t2,
Bill Wendling	cd4c73a	2008-09-22 00:44:35 +0000	[diff] [blame]	3047	getF32Constant(DAG, 0x3e65b8f3));
Bill Wendling	b4ec283	2008-09-09 22:13:54 +0000	[diff] [blame]	3048	SDValue t4 = DAG.getNode(ISD::FMUL, MVT::f32, t3, X);
				3049	SDValue t5 = DAG.getNode(ISD::FADD, MVT::f32, t4,
Bill Wendling	cd4c73a	2008-09-22 00:44:35 +0000	[diff] [blame]	3050	getF32Constant(DAG, 0x3f324b07));
Bill Wendling	b4ec283	2008-09-09 22:13:54 +0000	[diff] [blame]	3051	SDValue t6 = DAG.getNode(ISD::FMUL, MVT::f32, t5, X);
				3052	SDValue t7 = DAG.getNode(ISD::FADD, MVT::f32, t6,
Bill Wendling	cd4c73a	2008-09-22 00:44:35 +0000	[diff] [blame]	3053	getF32Constant(DAG, 0x3f7ff8fd));
Bill Wendling	b4ec283	2008-09-09 22:13:54 +0000	[diff] [blame]	3054	SDValue TwoToFracPartOfX = DAG.getNode(ISD::BIT_CONVERT, MVT::i32, t7);
				3055
				3056	// Add the exponent into the result in integer domain.
				3057	SDValue t8 = DAG.getNode(ISD::ADD, MVT::i32,
				3058	TwoToFracPartOfX, IntegerPartOfX);
				3059
				3060	result = DAG.getNode(ISD::BIT_CONVERT, MVT::f32, t8);
				3061	} else { // LimitFloatPrecision > 12 && LimitFloatPrecision <= 18
				3062	// For floating-point precision of 18:
				3063	//
				3064	// TwoToFractionalPartOfX =
				3065	// 0.999999982f +
				3066	// (0.693148872f +
				3067	// (0.240227044f +
				3068	// (0.554906021e-1f +
				3069	// (0.961591928e-2f +
				3070	// (0.136028312e-2f + 0.157059148e-3f x)x)x)x)x)x;
				3071	//
				3072	// error 2.47208000*10^(-7), which is better than 18 bits
				3073	SDValue t2 = DAG.getNode(ISD::FMUL, MVT::f32, X,
Bill Wendling	cd4c73a	2008-09-22 00:44:35 +0000	[diff] [blame]	3074	getF32Constant(DAG, 0x3924b03e));
Bill Wendling	b4ec283	2008-09-09 22:13:54 +0000	[diff] [blame]	3075	SDValue t3 = DAG.getNode(ISD::FADD, MVT::f32, t2,
Bill Wendling	cd4c73a	2008-09-22 00:44:35 +0000	[diff] [blame]	3076	getF32Constant(DAG, 0x3ab24b87));
Bill Wendling	b4ec283	2008-09-09 22:13:54 +0000	[diff] [blame]	3077	SDValue t4 = DAG.getNode(ISD::FMUL, MVT::f32, t3, X);
				3078	SDValue t5 = DAG.getNode(ISD::FADD, MVT::f32, t4,
Bill Wendling	cd4c73a	2008-09-22 00:44:35 +0000	[diff] [blame]	3079	getF32Constant(DAG, 0x3c1d8c17));
Bill Wendling	b4ec283	2008-09-09 22:13:54 +0000	[diff] [blame]	3080	SDValue t6 = DAG.getNode(ISD::FMUL, MVT::f32, t5, X);
				3081	SDValue t7 = DAG.getNode(ISD::FADD, MVT::f32, t6,
Bill Wendling	cd4c73a	2008-09-22 00:44:35 +0000	[diff] [blame]	3082	getF32Constant(DAG, 0x3d634a1d));
Bill Wendling	b4ec283	2008-09-09 22:13:54 +0000	[diff] [blame]	3083	SDValue t8 = DAG.getNode(ISD::FMUL, MVT::f32, t7, X);
				3084	SDValue t9 = DAG.getNode(ISD::FADD, MVT::f32, t8,
Bill Wendling	cd4c73a	2008-09-22 00:44:35 +0000	[diff] [blame]	3085	getF32Constant(DAG, 0x3e75fe14));
Bill Wendling	b4ec283	2008-09-09 22:13:54 +0000	[diff] [blame]	3086	SDValue t10 = DAG.getNode(ISD::FMUL, MVT::f32, t9, X);
				3087	SDValue t11 = DAG.getNode(ISD::FADD, MVT::f32, t10,
Bill Wendling	cd4c73a	2008-09-22 00:44:35 +0000	[diff] [blame]	3088	getF32Constant(DAG, 0x3f317234));
Bill Wendling	b4ec283	2008-09-09 22:13:54 +0000	[diff] [blame]	3089	SDValue t12 = DAG.getNode(ISD::FMUL, MVT::f32, t11, X);
				3090	SDValue t13 = DAG.getNode(ISD::FADD, MVT::f32, t12,
Bill Wendling	cd4c73a	2008-09-22 00:44:35 +0000	[diff] [blame]	3091	getF32Constant(DAG, 0x3f800000));
Bill Wendling	b4ec283	2008-09-09 22:13:54 +0000	[diff] [blame]	3092	SDValue TwoToFracPartOfX = DAG.getNode(ISD::BIT_CONVERT, MVT::i32, t13);
				3093
				3094	// Add the exponent into the result in integer domain.
				3095	SDValue t14 = DAG.getNode(ISD::ADD, MVT::i32,
				3096	TwoToFracPartOfX, IntegerPartOfX);
				3097
				3098	result = DAG.getNode(ISD::BIT_CONVERT, MVT::f32, t14);
				3099	}
				3100	} else {
				3101	// No special expansion.
				3102	result = DAG.getNode(ISD::FEXP,
				3103	getValue(I.getOperand(1)).getValueType(),
				3104	getValue(I.getOperand(1)));
				3105	}
				3106
Dale Johannesen	59e577f	2008-09-05 18:38:42 +0000	[diff] [blame]	3107	setValue(&I, result);
				3108	}
				3109
Bill Wendling	3915025	2008-09-09 20:39:27 +0000	[diff] [blame]	3110	/// visitLog - Lower a log intrinsic. Handles the special sequences for
				3111	/// limited-precision mode.
Dale Johannesen	59e577f	2008-09-05 18:38:42 +0000	[diff] [blame]	3112	void
				3113	SelectionDAGLowering::visitLog(CallInst &I) {
				3114	SDValue result;
Bill Wendling	3915025	2008-09-09 20:39:27 +0000	[diff] [blame]	3115
				3116	if (getValue(I.getOperand(1)).getValueType() == MVT::f32 &&
				3117	LimitFloatPrecision > 0 && LimitFloatPrecision <= 18) {
				3118	SDValue Op = getValue(I.getOperand(1));
				3119	SDValue Op1 = DAG.getNode(ISD::BIT_CONVERT, MVT::i32, Op);
				3120
				3121	// Scale the exponent by log(2) [0.69314718f].
				3122	SDValue Exp = GetExponent(DAG, Op1);
				3123	SDValue LogOfExponent = DAG.getNode(ISD::FMUL, MVT::f32, Exp,
Bill Wendling	cd4c73a	2008-09-22 00:44:35 +0000	[diff] [blame]	3124	getF32Constant(DAG, 0x3f317218));
Bill Wendling	3915025	2008-09-09 20:39:27 +0000	[diff] [blame]	3125
				3126	// Get the significand and build it into a floating-point number with
				3127	// exponent of 1.
				3128	SDValue X = GetSignificand(DAG, Op1);
				3129
				3130	if (LimitFloatPrecision <= 6) {
				3131	// For floating-point precision of 6:
				3132	//
				3133	// LogofMantissa =
				3134	// -1.1609546f +
				3135	// (1.4034025f - 0.23903021f * x) * x;
				3136	//
				3137	// error 0.0034276066, which is better than 8 bits
				3138	SDValue t0 = DAG.getNode(ISD::FMUL, MVT::f32, X,
Bill Wendling	cd4c73a	2008-09-22 00:44:35 +0000	[diff] [blame]	3139	getF32Constant(DAG, 0xbe74c456));
Bill Wendling	3915025	2008-09-09 20:39:27 +0000	[diff] [blame]	3140	SDValue t1 = DAG.getNode(ISD::FADD, MVT::f32, t0,
Bill Wendling	cd4c73a	2008-09-22 00:44:35 +0000	[diff] [blame]	3141	getF32Constant(DAG, 0x3fb3a2b1));
Bill Wendling	3915025	2008-09-09 20:39:27 +0000	[diff] [blame]	3142	SDValue t2 = DAG.getNode(ISD::FMUL, MVT::f32, t1, X);
				3143	SDValue LogOfMantissa = DAG.getNode(ISD::FSUB, MVT::f32, t2,
Bill Wendling	cd4c73a	2008-09-22 00:44:35 +0000	[diff] [blame]	3144	getF32Constant(DAG, 0x3f949a29));
Bill Wendling	3915025	2008-09-09 20:39:27 +0000	[diff] [blame]	3145
				3146	result = DAG.getNode(ISD::FADD, MVT::f32, LogOfExponent, LogOfMantissa);
				3147	} else if (LimitFloatPrecision > 6 && LimitFloatPrecision <= 12) {
				3148	// For floating-point precision of 12:
				3149	//
				3150	// LogOfMantissa =
				3151	// -1.7417939f +
				3152	// (2.8212026f +
				3153	// (-1.4699568f +
				3154	// (0.44717955f - 0.56570851e-1f * x) * x) * x) * x;
				3155	//
				3156	// error 0.000061011436, which is 14 bits
				3157	SDValue t0 = DAG.getNode(ISD::FMUL, MVT::f32, X,
Bill Wendling	cd4c73a	2008-09-22 00:44:35 +0000	[diff] [blame]	3158	getF32Constant(DAG, 0xbd67b6d6));
Bill Wendling	3915025	2008-09-09 20:39:27 +0000	[diff] [blame]	3159	SDValue t1 = DAG.getNode(ISD::FADD, MVT::f32, t0,
Bill Wendling	cd4c73a	2008-09-22 00:44:35 +0000	[diff] [blame]	3160	getF32Constant(DAG, 0x3ee4f4b8));
Bill Wendling	3915025	2008-09-09 20:39:27 +0000	[diff] [blame]	3161	SDValue t2 = DAG.getNode(ISD::FMUL, MVT::f32, t1, X);
				3162	SDValue t3 = DAG.getNode(ISD::FSUB, MVT::f32, t2,
Bill Wendling	cd4c73a	2008-09-22 00:44:35 +0000	[diff] [blame]	3163	getF32Constant(DAG, 0x3fbc278b));
Bill Wendling	3915025	2008-09-09 20:39:27 +0000	[diff] [blame]	3164	SDValue t4 = DAG.getNode(ISD::FMUL, MVT::f32, t3, X);
				3165	SDValue t5 = DAG.getNode(ISD::FADD, MVT::f32, t4,
Bill Wendling	cd4c73a	2008-09-22 00:44:35 +0000	[diff] [blame]	3166	getF32Constant(DAG, 0x40348e95));
Bill Wendling	3915025	2008-09-09 20:39:27 +0000	[diff] [blame]	3167	SDValue t6 = DAG.getNode(ISD::FMUL, MVT::f32, t5, X);
				3168	SDValue LogOfMantissa = DAG.getNode(ISD::FSUB, MVT::f32, t6,
Bill Wendling	cd4c73a	2008-09-22 00:44:35 +0000	[diff] [blame]	3169	getF32Constant(DAG, 0x3fdef31a));
Bill Wendling	3915025	2008-09-09 20:39:27 +0000	[diff] [blame]	3170
				3171	result = DAG.getNode(ISD::FADD, MVT::f32, LogOfExponent, LogOfMantissa);
				3172	} else { // LimitFloatPrecision > 12 && LimitFloatPrecision <= 18
				3173	// For floating-point precision of 18:
				3174	//
				3175	// LogOfMantissa =
				3176	// -2.1072184f +
				3177	// (4.2372794f +
				3178	// (-3.7029485f +
				3179	// (2.2781945f +
				3180	// (-0.87823314f +
				3181	// (0.19073739f - 0.17809712e-1f * x) * x) * x) * x) * x)*x;
				3182	//
				3183	// error 0.0000023660568, which is better than 18 bits
				3184	SDValue t0 = DAG.getNode(ISD::FMUL, MVT::f32, X,
Bill Wendling	cd4c73a	2008-09-22 00:44:35 +0000	[diff] [blame]	3185	getF32Constant(DAG, 0xbc91e5ac));
Bill Wendling	3915025	2008-09-09 20:39:27 +0000	[diff] [blame]	3186	SDValue t1 = DAG.getNode(ISD::FADD, MVT::f32, t0,
Bill Wendling	cd4c73a	2008-09-22 00:44:35 +0000	[diff] [blame]	3187	getF32Constant(DAG, 0x3e4350aa));
Bill Wendling	3915025	2008-09-09 20:39:27 +0000	[diff] [blame]	3188	SDValue t2 = DAG.getNode(ISD::FMUL, MVT::f32, t1, X);
				3189	SDValue t3 = DAG.getNode(ISD::FSUB, MVT::f32, t2,
Bill Wendling	cd4c73a	2008-09-22 00:44:35 +0000	[diff] [blame]	3190	getF32Constant(DAG, 0x3f60d3e3));
Bill Wendling	3915025	2008-09-09 20:39:27 +0000	[diff] [blame]	3191	SDValue t4 = DAG.getNode(ISD::FMUL, MVT::f32, t3, X);
				3192	SDValue t5 = DAG.getNode(ISD::FADD, MVT::f32, t4,
Bill Wendling	cd4c73a	2008-09-22 00:44:35 +0000	[diff] [blame]	3193	getF32Constant(DAG, 0x4011cdf0));
Bill Wendling	3915025	2008-09-09 20:39:27 +0000	[diff] [blame]	3194	SDValue t6 = DAG.getNode(ISD::FMUL, MVT::f32, t5, X);
				3195	SDValue t7 = DAG.getNode(ISD::FSUB, MVT::f32, t6,
Bill Wendling	cd4c73a	2008-09-22 00:44:35 +0000	[diff] [blame]	3196	getF32Constant(DAG, 0x406cfd1c));
Bill Wendling	3915025	2008-09-09 20:39:27 +0000	[diff] [blame]	3197	SDValue t8 = DAG.getNode(ISD::FMUL, MVT::f32, t7, X);
				3198	SDValue t9 = DAG.getNode(ISD::FADD, MVT::f32, t8,
Bill Wendling	cd4c73a	2008-09-22 00:44:35 +0000	[diff] [blame]	3199	getF32Constant(DAG, 0x408797cb));
Bill Wendling	3915025	2008-09-09 20:39:27 +0000	[diff] [blame]	3200	SDValue t10 = DAG.getNode(ISD::FMUL, MVT::f32, t9, X);
				3201	SDValue LogOfMantissa = DAG.getNode(ISD::FSUB, MVT::f32, t10,
Bill Wendling	cd4c73a	2008-09-22 00:44:35 +0000	[diff] [blame]	3202	getF32Constant(DAG, 0x4006dcab));
Bill Wendling	3915025	2008-09-09 20:39:27 +0000	[diff] [blame]	3203
				3204	result = DAG.getNode(ISD::FADD, MVT::f32, LogOfExponent, LogOfMantissa);
				3205	}
				3206	} else {
				3207	// No special expansion.
				3208	result = DAG.getNode(ISD::FLOG,
				3209	getValue(I.getOperand(1)).getValueType(),
				3210	getValue(I.getOperand(1)));
				3211	}
				3212
Dale Johannesen	59e577f	2008-09-05 18:38:42 +0000	[diff] [blame]	3213	setValue(&I, result);
				3214	}
				3215
Bill Wendling	3eb5940	2008-09-09 00:28:24 +0000	[diff] [blame]	3216	/// visitLog2 - Lower a log2 intrinsic. Handles the special sequences for
				3217	/// limited-precision mode.
Dale Johannesen	59e577f	2008-09-05 18:38:42 +0000	[diff] [blame]	3218	void
				3219	SelectionDAGLowering::visitLog2(CallInst &I) {
				3220	SDValue result;
Bill Wendling	3eb5940	2008-09-09 00:28:24 +0000	[diff] [blame]	3221
Dale Johannesen	853244f	2008-09-05 23:49:37 +0000	[diff] [blame]	3222	if (getValue(I.getOperand(1)).getValueType() == MVT::f32 &&
Bill Wendling	3eb5940	2008-09-09 00:28:24 +0000	[diff] [blame]	3223	LimitFloatPrecision > 0 && LimitFloatPrecision <= 18) {
				3224	SDValue Op = getValue(I.getOperand(1));
				3225	SDValue Op1 = DAG.getNode(ISD::BIT_CONVERT, MVT::i32, Op);
				3226
Bill Wendling	3915025	2008-09-09 20:39:27 +0000	[diff] [blame]	3227	// Get the exponent.
				3228	SDValue LogOfExponent = GetExponent(DAG, Op1);
Bill Wendling	3eb5940	2008-09-09 00:28:24 +0000	[diff] [blame]	3229
				3230	// Get the significand and build it into a floating-point number with
Bill Wendling	3915025	2008-09-09 20:39:27 +0000	[diff] [blame]	3231	// exponent of 1.
				3232	SDValue X = GetSignificand(DAG, Op1);
Bill Wendling	3eb5940	2008-09-09 00:28:24 +0000	[diff] [blame]	3233
				3234	// Different possible minimax approximations of significand in
				3235	// floating-point for various degrees of accuracy over [1,2].
				3236	if (LimitFloatPrecision <= 6) {
				3237	// For floating-point precision of 6:
				3238	//
				3239	// Log2ofMantissa = -1.6749035f + (2.0246817f - .34484768f * x) * x;
				3240	//
				3241	// error 0.0049451742, which is more than 7 bits
Bill Wendling	3915025	2008-09-09 20:39:27 +0000	[diff] [blame]	3242	SDValue t0 = DAG.getNode(ISD::FMUL, MVT::f32, X,
Bill Wendling	cd4c73a	2008-09-22 00:44:35 +0000	[diff] [blame]	3243	getF32Constant(DAG, 0xbeb08fe0));
Bill Wendling	3915025	2008-09-09 20:39:27 +0000	[diff] [blame]	3244	SDValue t1 = DAG.getNode(ISD::FADD, MVT::f32, t0,
Bill Wendling	cd4c73a	2008-09-22 00:44:35 +0000	[diff] [blame]	3245	getF32Constant(DAG, 0x40019463));
Bill Wendling	3915025	2008-09-09 20:39:27 +0000	[diff] [blame]	3246	SDValue t2 = DAG.getNode(ISD::FMUL, MVT::f32, t1, X);
				3247	SDValue Log2ofMantissa = DAG.getNode(ISD::FSUB, MVT::f32, t2,
Bill Wendling	cd4c73a	2008-09-22 00:44:35 +0000	[diff] [blame]	3248	getF32Constant(DAG, 0x3fd6633d));
Bill Wendling	3eb5940	2008-09-09 00:28:24 +0000	[diff] [blame]	3249
				3250	result = DAG.getNode(ISD::FADD, MVT::f32, LogOfExponent, Log2ofMantissa);
				3251	} else if (LimitFloatPrecision > 6 && LimitFloatPrecision <= 12) {
				3252	// For floating-point precision of 12:
				3253	//
				3254	// Log2ofMantissa =
				3255	// -2.51285454f +
				3256	// (4.07009056f +
				3257	// (-2.12067489f +
				3258	// (.645142248f - 0.816157886e-1f * x) * x) * x) * x;
				3259	//
				3260	// error 0.0000876136000, which is better than 13 bits
Bill Wendling	3915025	2008-09-09 20:39:27 +0000	[diff] [blame]	3261	SDValue t0 = DAG.getNode(ISD::FMUL, MVT::f32, X,
Bill Wendling	cd4c73a	2008-09-22 00:44:35 +0000	[diff] [blame]	3262	getF32Constant(DAG, 0xbda7262e));
Bill Wendling	3915025	2008-09-09 20:39:27 +0000	[diff] [blame]	3263	SDValue t1 = DAG.getNode(ISD::FADD, MVT::f32, t0,
Bill Wendling	cd4c73a	2008-09-22 00:44:35 +0000	[diff] [blame]	3264	getF32Constant(DAG, 0x3f25280b));
Bill Wendling	3915025	2008-09-09 20:39:27 +0000	[diff] [blame]	3265	SDValue t2 = DAG.getNode(ISD::FMUL, MVT::f32, t1, X);
				3266	SDValue t3 = DAG.getNode(ISD::FSUB, MVT::f32, t2,
Bill Wendling	cd4c73a	2008-09-22 00:44:35 +0000	[diff] [blame]	3267	getF32Constant(DAG, 0x4007b923));
Bill Wendling	3915025	2008-09-09 20:39:27 +0000	[diff] [blame]	3268	SDValue t4 = DAG.getNode(ISD::FMUL, MVT::f32, t3, X);
				3269	SDValue t5 = DAG.getNode(ISD::FADD, MVT::f32, t4,
Bill Wendling	cd4c73a	2008-09-22 00:44:35 +0000	[diff] [blame]	3270	getF32Constant(DAG, 0x40823e2f));
Bill Wendling	3915025	2008-09-09 20:39:27 +0000	[diff] [blame]	3271	SDValue t6 = DAG.getNode(ISD::FMUL, MVT::f32, t5, X);
				3272	SDValue Log2ofMantissa = DAG.getNode(ISD::FSUB, MVT::f32, t6,
Bill Wendling	cd4c73a	2008-09-22 00:44:35 +0000	[diff] [blame]	3273	getF32Constant(DAG, 0x4020d29c));
Bill Wendling	3eb5940	2008-09-09 00:28:24 +0000	[diff] [blame]	3274
				3275	result = DAG.getNode(ISD::FADD, MVT::f32, LogOfExponent, Log2ofMantissa);
				3276	} else { // LimitFloatPrecision > 12 && LimitFloatPrecision <= 18
				3277	// For floating-point precision of 18:
				3278	//
				3279	// Log2ofMantissa =
				3280	// -3.0400495f +
				3281	// (6.1129976f +
				3282	// (-5.3420409f +
				3283	// (3.2865683f +
				3284	// (-1.2669343f +
				3285	// (0.27515199f -
				3286	// 0.25691327e-1f * x) * x) * x) * x) * x) * x;
				3287	//
				3288	// error 0.0000018516, which is better than 18 bits
Bill Wendling	3915025	2008-09-09 20:39:27 +0000	[diff] [blame]	3289	SDValue t0 = DAG.getNode(ISD::FMUL, MVT::f32, X,
Bill Wendling	cd4c73a	2008-09-22 00:44:35 +0000	[diff] [blame]	3290	getF32Constant(DAG, 0xbcd2769e));
Bill Wendling	3915025	2008-09-09 20:39:27 +0000	[diff] [blame]	3291	SDValue t1 = DAG.getNode(ISD::FADD, MVT::f32, t0,
Bill Wendling	cd4c73a	2008-09-22 00:44:35 +0000	[diff] [blame]	3292	getF32Constant(DAG, 0x3e8ce0b9));
Bill Wendling	3915025	2008-09-09 20:39:27 +0000	[diff] [blame]	3293	SDValue t2 = DAG.getNode(ISD::FMUL, MVT::f32, t1, X);
				3294	SDValue t3 = DAG.getNode(ISD::FSUB, MVT::f32, t2,
Bill Wendling	cd4c73a	2008-09-22 00:44:35 +0000	[diff] [blame]	3295	getF32Constant(DAG, 0x3fa22ae7));
Bill Wendling	3915025	2008-09-09 20:39:27 +0000	[diff] [blame]	3296	SDValue t4 = DAG.getNode(ISD::FMUL, MVT::f32, t3, X);
				3297	SDValue t5 = DAG.getNode(ISD::FADD, MVT::f32, t4,
Bill Wendling	cd4c73a	2008-09-22 00:44:35 +0000	[diff] [blame]	3298	getF32Constant(DAG, 0x40525723));
Bill Wendling	3915025	2008-09-09 20:39:27 +0000	[diff] [blame]	3299	SDValue t6 = DAG.getNode(ISD::FMUL, MVT::f32, t5, X);
				3300	SDValue t7 = DAG.getNode(ISD::FSUB, MVT::f32, t6,
Bill Wendling	cd4c73a	2008-09-22 00:44:35 +0000	[diff] [blame]	3301	getF32Constant(DAG, 0x40aaf200));
Bill Wendling	3915025	2008-09-09 20:39:27 +0000	[diff] [blame]	3302	SDValue t8 = DAG.getNode(ISD::FMUL, MVT::f32, t7, X);
				3303	SDValue t9 = DAG.getNode(ISD::FADD, MVT::f32, t8,
Bill Wendling	cd4c73a	2008-09-22 00:44:35 +0000	[diff] [blame]	3304	getF32Constant(DAG, 0x40c39dad));
Bill Wendling	3eb5940	2008-09-09 00:28:24 +0000	[diff] [blame]	3305	SDValue t10 = DAG.getNode(ISD::FMUL, MVT::f32, t9, X);
Bill Wendling	3915025	2008-09-09 20:39:27 +0000	[diff] [blame]	3306	SDValue Log2ofMantissa = DAG.getNode(ISD::FSUB, MVT::f32, t10,
Bill Wendling	cd4c73a	2008-09-22 00:44:35 +0000	[diff] [blame]	3307	getF32Constant(DAG, 0x4042902c));
Bill Wendling	3eb5940	2008-09-09 00:28:24 +0000	[diff] [blame]	3308
				3309	result = DAG.getNode(ISD::FADD, MVT::f32, LogOfExponent, Log2ofMantissa);
				3310	}
Dale Johannesen	853244f	2008-09-05 23:49:37 +0000	[diff] [blame]	3311	} else {
Bill Wendling	3eb5940	2008-09-09 00:28:24 +0000	[diff] [blame]	3312	// No special expansion.
Dale Johannesen	853244f	2008-09-05 23:49:37 +0000	[diff] [blame]	3313	result = DAG.getNode(ISD::FLOG2,
				3314	getValue(I.getOperand(1)).getValueType(),
				3315	getValue(I.getOperand(1)));
				3316	}
Bill Wendling	3eb5940	2008-09-09 00:28:24 +0000	[diff] [blame]	3317
Dale Johannesen	59e577f	2008-09-05 18:38:42 +0000	[diff] [blame]	3318	setValue(&I, result);
				3319	}
				3320
Bill Wendling	3eb5940	2008-09-09 00:28:24 +0000	[diff] [blame]	3321	/// visitLog10 - Lower a log10 intrinsic. Handles the special sequences for
				3322	/// limited-precision mode.
Dale Johannesen	59e577f	2008-09-05 18:38:42 +0000	[diff] [blame]	3323	void
				3324	SelectionDAGLowering::visitLog10(CallInst &I) {
				3325	SDValue result;
Bill Wendling	181b627	2008-10-19 20:34:04 +0000	[diff] [blame]	3326
Dale Johannesen	852680a	2008-09-05 21:27:19 +0000	[diff] [blame]	3327	if (getValue(I.getOperand(1)).getValueType() == MVT::f32 &&
Bill Wendling	3eb5940	2008-09-09 00:28:24 +0000	[diff] [blame]	3328	LimitFloatPrecision > 0 && LimitFloatPrecision <= 18) {
				3329	SDValue Op = getValue(I.getOperand(1));
				3330	SDValue Op1 = DAG.getNode(ISD::BIT_CONVERT, MVT::i32, Op);
				3331
Bill Wendling	3915025	2008-09-09 20:39:27 +0000	[diff] [blame]	3332	// Scale the exponent by log10(2) [0.30102999f].
				3333	SDValue Exp = GetExponent(DAG, Op1);
				3334	SDValue LogOfExponent = DAG.getNode(ISD::FMUL, MVT::f32, Exp,
Bill Wendling	cd4c73a	2008-09-22 00:44:35 +0000	[diff] [blame]	3335	getF32Constant(DAG, 0x3e9a209a));
Bill Wendling	3eb5940	2008-09-09 00:28:24 +0000	[diff] [blame]	3336
				3337	// Get the significand and build it into a floating-point number with
Bill Wendling	3915025	2008-09-09 20:39:27 +0000	[diff] [blame]	3338	// exponent of 1.
				3339	SDValue X = GetSignificand(DAG, Op1);
Bill Wendling	3eb5940	2008-09-09 00:28:24 +0000	[diff] [blame]	3340
				3341	if (LimitFloatPrecision <= 6) {
Bill Wendling	bd297bc	2008-09-09 18:42:23 +0000	[diff] [blame]	3342	// For floating-point precision of 6:
				3343	//
				3344	// Log10ofMantissa =
				3345	// -0.50419619f +
				3346	// (0.60948995f - 0.10380950f * x) * x;
				3347	//
				3348	// error 0.0014886165, which is 6 bits
Bill Wendling	3915025	2008-09-09 20:39:27 +0000	[diff] [blame]	3349	SDValue t0 = DAG.getNode(ISD::FMUL, MVT::f32, X,
Bill Wendling	cd4c73a	2008-09-22 00:44:35 +0000	[diff] [blame]	3350	getF32Constant(DAG, 0xbdd49a13));
Bill Wendling	3915025	2008-09-09 20:39:27 +0000	[diff] [blame]	3351	SDValue t1 = DAG.getNode(ISD::FADD, MVT::f32, t0,
Bill Wendling	cd4c73a	2008-09-22 00:44:35 +0000	[diff] [blame]	3352	getF32Constant(DAG, 0x3f1c0789));
Bill Wendling	3915025	2008-09-09 20:39:27 +0000	[diff] [blame]	3353	SDValue t2 = DAG.getNode(ISD::FMUL, MVT::f32, t1, X);
				3354	SDValue Log10ofMantissa = DAG.getNode(ISD::FSUB, MVT::f32, t2,
Bill Wendling	cd4c73a	2008-09-22 00:44:35 +0000	[diff] [blame]	3355	getF32Constant(DAG, 0x3f011300));
Bill Wendling	bd297bc	2008-09-09 18:42:23 +0000	[diff] [blame]	3356
				3357	result = DAG.getNode(ISD::FADD, MVT::f32, LogOfExponent, Log10ofMantissa);
Bill Wendling	3eb5940	2008-09-09 00:28:24 +0000	[diff] [blame]	3358	} else if (LimitFloatPrecision > 6 && LimitFloatPrecision <= 12) {
				3359	// For floating-point precision of 12:
				3360	//
				3361	// Log10ofMantissa =
				3362	// -0.64831180f +
				3363	// (0.91751397f +
				3364	// (-0.31664806f + 0.47637168e-1f * x) * x) * x;
				3365	//
				3366	// error 0.00019228036, which is better than 12 bits
Bill Wendling	3915025	2008-09-09 20:39:27 +0000	[diff] [blame]	3367	SDValue t0 = DAG.getNode(ISD::FMUL, MVT::f32, X,
Bill Wendling	cd4c73a	2008-09-22 00:44:35 +0000	[diff] [blame]	3368	getF32Constant(DAG, 0x3d431f31));
Bill Wendling	3915025	2008-09-09 20:39:27 +0000	[diff] [blame]	3369	SDValue t1 = DAG.getNode(ISD::FSUB, MVT::f32, t0,
Bill Wendling	cd4c73a	2008-09-22 00:44:35 +0000	[diff] [blame]	3370	getF32Constant(DAG, 0x3ea21fb2));
Bill Wendling	3915025	2008-09-09 20:39:27 +0000	[diff] [blame]	3371	SDValue t2 = DAG.getNode(ISD::FMUL, MVT::f32, t1, X);
				3372	SDValue t3 = DAG.getNode(ISD::FADD, MVT::f32, t2,
Bill Wendling	cd4c73a	2008-09-22 00:44:35 +0000	[diff] [blame]	3373	getF32Constant(DAG, 0x3f6ae232));
Bill Wendling	3915025	2008-09-09 20:39:27 +0000	[diff] [blame]	3374	SDValue t4 = DAG.getNode(ISD::FMUL, MVT::f32, t3, X);
				3375	SDValue Log10ofMantissa = DAG.getNode(ISD::FSUB, MVT::f32, t4,
Bill Wendling	cd4c73a	2008-09-22 00:44:35 +0000	[diff] [blame]	3376	getF32Constant(DAG, 0x3f25f7c3));
Bill Wendling	3eb5940	2008-09-09 00:28:24 +0000	[diff] [blame]	3377
				3378	result = DAG.getNode(ISD::FADD, MVT::f32, LogOfExponent, Log10ofMantissa);
				3379	} else { // LimitFloatPrecision > 12 && LimitFloatPrecision <= 18
Bill Wendling	bd297bc	2008-09-09 18:42:23 +0000	[diff] [blame]	3380	// For floating-point precision of 18:
				3381	//
				3382	// Log10ofMantissa =
				3383	// -0.84299375f +
				3384	// (1.5327582f +
				3385	// (-1.0688956f +
				3386	// (0.49102474f +
				3387	// (-0.12539807f + 0.13508273e-1f * x) * x) * x) * x) * x;
				3388	//
				3389	// error 0.0000037995730, which is better than 18 bits
Bill Wendling	3915025	2008-09-09 20:39:27 +0000	[diff] [blame]	3390	SDValue t0 = DAG.getNode(ISD::FMUL, MVT::f32, X,
Bill Wendling	cd4c73a	2008-09-22 00:44:35 +0000	[diff] [blame]	3391	getF32Constant(DAG, 0x3c5d51ce));
Bill Wendling	3915025	2008-09-09 20:39:27 +0000	[diff] [blame]	3392	SDValue t1 = DAG.getNode(ISD::FSUB, MVT::f32, t0,
Bill Wendling	cd4c73a	2008-09-22 00:44:35 +0000	[diff] [blame]	3393	getF32Constant(DAG, 0x3e00685a));
Bill Wendling	3915025	2008-09-09 20:39:27 +0000	[diff] [blame]	3394	SDValue t2 = DAG.getNode(ISD::FMUL, MVT::f32, t1, X);
				3395	SDValue t3 = DAG.getNode(ISD::FADD, MVT::f32, t2,
Bill Wendling	cd4c73a	2008-09-22 00:44:35 +0000	[diff] [blame]	3396	getF32Constant(DAG, 0x3efb6798));
Bill Wendling	3915025	2008-09-09 20:39:27 +0000	[diff] [blame]	3397	SDValue t4 = DAG.getNode(ISD::FMUL, MVT::f32, t3, X);
				3398	SDValue t5 = DAG.getNode(ISD::FSUB, MVT::f32, t4,
Bill Wendling	cd4c73a	2008-09-22 00:44:35 +0000	[diff] [blame]	3399	getF32Constant(DAG, 0x3f88d192));
Bill Wendling	3915025	2008-09-09 20:39:27 +0000	[diff] [blame]	3400	SDValue t6 = DAG.getNode(ISD::FMUL, MVT::f32, t5, X);
				3401	SDValue t7 = DAG.getNode(ISD::FADD, MVT::f32, t6,
Bill Wendling	cd4c73a	2008-09-22 00:44:35 +0000	[diff] [blame]	3402	getF32Constant(DAG, 0x3fc4316c));
Bill Wendling	bd297bc	2008-09-09 18:42:23 +0000	[diff] [blame]	3403	SDValue t8 = DAG.getNode(ISD::FMUL, MVT::f32, t7, X);
Bill Wendling	3915025	2008-09-09 20:39:27 +0000	[diff] [blame]	3404	SDValue Log10ofMantissa = DAG.getNode(ISD::FSUB, MVT::f32, t8,
Bill Wendling	cd4c73a	2008-09-22 00:44:35 +0000	[diff] [blame]	3405	getF32Constant(DAG, 0x3f57ce70));
Bill Wendling	bd297bc	2008-09-09 18:42:23 +0000	[diff] [blame]	3406
				3407	result = DAG.getNode(ISD::FADD, MVT::f32, LogOfExponent, Log10ofMantissa);
Bill Wendling	3eb5940	2008-09-09 00:28:24 +0000	[diff] [blame]	3408	}
Dale Johannesen	852680a	2008-09-05 21:27:19 +0000	[diff] [blame]	3409	} else {
Bill Wendling	3eb5940	2008-09-09 00:28:24 +0000	[diff] [blame]	3410	// No special expansion.
Dale Johannesen	852680a	2008-09-05 21:27:19 +0000	[diff] [blame]	3411	result = DAG.getNode(ISD::FLOG10,
				3412	getValue(I.getOperand(1)).getValueType(),
				3413	getValue(I.getOperand(1)));
				3414	}
Bill Wendling	3eb5940	2008-09-09 00:28:24 +0000	[diff] [blame]	3415
Dale Johannesen	59e577f	2008-09-05 18:38:42 +0000	[diff] [blame]	3416	setValue(&I, result);
				3417	}
				3418
Bill Wendling	e10c814	2008-09-09 22:39:21 +0000	[diff] [blame]	3419	/// visitExp2 - Lower an exp2 intrinsic. Handles the special sequences for
				3420	/// limited-precision mode.
Dale Johannesen	601d3c0	2008-09-05 01:48:15 +0000	[diff] [blame]	3421	void
				3422	SelectionDAGLowering::visitExp2(CallInst &I) {
				3423	SDValue result;
Bill Wendling	e10c814	2008-09-09 22:39:21 +0000	[diff] [blame]	3424
Dale Johannesen	601d3c0	2008-09-05 01:48:15 +0000	[diff] [blame]	3425	if (getValue(I.getOperand(1)).getValueType() == MVT::f32 &&
Bill Wendling	e10c814	2008-09-09 22:39:21 +0000	[diff] [blame]	3426	LimitFloatPrecision > 0 && LimitFloatPrecision <= 18) {
				3427	SDValue Op = getValue(I.getOperand(1));
				3428
				3429	SDValue IntegerPartOfX = DAG.getNode(ISD::FP_TO_SINT, MVT::i32, Op);
				3430
				3431	// FractionalPartOfX = x - (float)IntegerPartOfX;
				3432	SDValue t1 = DAG.getNode(ISD::SINT_TO_FP, MVT::f32, IntegerPartOfX);
				3433	SDValue X = DAG.getNode(ISD::FSUB, MVT::f32, Op, t1);
				3434
				3435	// IntegerPartOfX <<= 23;
				3436	IntegerPartOfX = DAG.getNode(ISD::SHL, MVT::i32, IntegerPartOfX,
				3437	DAG.getConstant(23, MVT::i32));
				3438
				3439	if (LimitFloatPrecision <= 6) {
				3440	// For floating-point precision of 6:
				3441	//
				3442	// TwoToFractionalPartOfX =
				3443	// 0.997535578f +
				3444	// (0.735607626f + 0.252464424f * x) * x;
				3445	//
				3446	// error 0.0144103317, which is 6 bits
				3447	SDValue t2 = DAG.getNode(ISD::FMUL, MVT::f32, X,
Bill Wendling	cd4c73a	2008-09-22 00:44:35 +0000	[diff] [blame]	3448	getF32Constant(DAG, 0x3e814304));
Bill Wendling	e10c814	2008-09-09 22:39:21 +0000	[diff] [blame]	3449	SDValue t3 = DAG.getNode(ISD::FADD, MVT::f32, t2,
Bill Wendling	cd4c73a	2008-09-22 00:44:35 +0000	[diff] [blame]	3450	getF32Constant(DAG, 0x3f3c50c8));
Bill Wendling	e10c814	2008-09-09 22:39:21 +0000	[diff] [blame]	3451	SDValue t4 = DAG.getNode(ISD::FMUL, MVT::f32, t3, X);
				3452	SDValue t5 = DAG.getNode(ISD::FADD, MVT::f32, t4,
Bill Wendling	cd4c73a	2008-09-22 00:44:35 +0000	[diff] [blame]	3453	getF32Constant(DAG, 0x3f7f5e7e));
Bill Wendling	e10c814	2008-09-09 22:39:21 +0000	[diff] [blame]	3454	SDValue t6 = DAG.getNode(ISD::BIT_CONVERT, MVT::i32, t5);
				3455	SDValue TwoToFractionalPartOfX =
				3456	DAG.getNode(ISD::ADD, MVT::i32, t6, IntegerPartOfX);
				3457
				3458	result = DAG.getNode(ISD::BIT_CONVERT, MVT::f32, TwoToFractionalPartOfX);
				3459	} else if (LimitFloatPrecision > 6 && LimitFloatPrecision <= 12) {
				3460	// For floating-point precision of 12:
				3461	//
				3462	// TwoToFractionalPartOfX =
				3463	// 0.999892986f +
				3464	// (0.696457318f +
				3465	// (0.224338339f + 0.792043434e-1f * x) * x) * x;
				3466	//
				3467	// error 0.000107046256, which is 13 to 14 bits
				3468	SDValue t2 = DAG.getNode(ISD::FMUL, MVT::f32, X,
Bill Wendling	cd4c73a	2008-09-22 00:44:35 +0000	[diff] [blame]	3469	getF32Constant(DAG, 0x3da235e3));
Bill Wendling	e10c814	2008-09-09 22:39:21 +0000	[diff] [blame]	3470	SDValue t3 = DAG.getNode(ISD::FADD, MVT::f32, t2,
Bill Wendling	cd4c73a	2008-09-22 00:44:35 +0000	[diff] [blame]	3471	getF32Constant(DAG, 0x3e65b8f3));
Bill Wendling	e10c814	2008-09-09 22:39:21 +0000	[diff] [blame]	3472	SDValue t4 = DAG.getNode(ISD::FMUL, MVT::f32, t3, X);
				3473	SDValue t5 = DAG.getNode(ISD::FADD, MVT::f32, t4,
Bill Wendling	cd4c73a	2008-09-22 00:44:35 +0000	[diff] [blame]	3474	getF32Constant(DAG, 0x3f324b07));
Bill Wendling	e10c814	2008-09-09 22:39:21 +0000	[diff] [blame]	3475	SDValue t6 = DAG.getNode(ISD::FMUL, MVT::f32, t5, X);
				3476	SDValue t7 = DAG.getNode(ISD::FADD, MVT::f32, t6,
Bill Wendling	cd4c73a	2008-09-22 00:44:35 +0000	[diff] [blame]	3477	getF32Constant(DAG, 0x3f7ff8fd));
Bill Wendling	e10c814	2008-09-09 22:39:21 +0000	[diff] [blame]	3478	SDValue t8 = DAG.getNode(ISD::BIT_CONVERT, MVT::i32, t7);
				3479	SDValue TwoToFractionalPartOfX =
				3480	DAG.getNode(ISD::ADD, MVT::i32, t8, IntegerPartOfX);
				3481
				3482	result = DAG.getNode(ISD::BIT_CONVERT, MVT::f32, TwoToFractionalPartOfX);
				3483	} else { // LimitFloatPrecision > 12 && LimitFloatPrecision <= 18
				3484	// For floating-point precision of 18:
				3485	//
				3486	// TwoToFractionalPartOfX =
				3487	// 0.999999982f +
				3488	// (0.693148872f +
				3489	// (0.240227044f +
				3490	// (0.554906021e-1f +
				3491	// (0.961591928e-2f +
				3492	// (0.136028312e-2f + 0.157059148e-3f x)x)x)x)x)x;
				3493	// error 2.47208000*10^(-7), which is better than 18 bits
				3494	SDValue t2 = DAG.getNode(ISD::FMUL, MVT::f32, X,
Bill Wendling	cd4c73a	2008-09-22 00:44:35 +0000	[diff] [blame]	3495	getF32Constant(DAG, 0x3924b03e));
Bill Wendling	e10c814	2008-09-09 22:39:21 +0000	[diff] [blame]	3496	SDValue t3 = DAG.getNode(ISD::FADD, MVT::f32, t2,
Bill Wendling	cd4c73a	2008-09-22 00:44:35 +0000	[diff] [blame]	3497	getF32Constant(DAG, 0x3ab24b87));
Bill Wendling	e10c814	2008-09-09 22:39:21 +0000	[diff] [blame]	3498	SDValue t4 = DAG.getNode(ISD::FMUL, MVT::f32, t3, X);
				3499	SDValue t5 = DAG.getNode(ISD::FADD, MVT::f32, t4,
Bill Wendling	cd4c73a	2008-09-22 00:44:35 +0000	[diff] [blame]	3500	getF32Constant(DAG, 0x3c1d8c17));
Bill Wendling	e10c814	2008-09-09 22:39:21 +0000	[diff] [blame]	3501	SDValue t6 = DAG.getNode(ISD::FMUL, MVT::f32, t5, X);
				3502	SDValue t7 = DAG.getNode(ISD::FADD, MVT::f32, t6,
Bill Wendling	cd4c73a	2008-09-22 00:44:35 +0000	[diff] [blame]	3503	getF32Constant(DAG, 0x3d634a1d));
Bill Wendling	e10c814	2008-09-09 22:39:21 +0000	[diff] [blame]	3504	SDValue t8 = DAG.getNode(ISD::FMUL, MVT::f32, t7, X);
				3505	SDValue t9 = DAG.getNode(ISD::FADD, MVT::f32, t8,
Bill Wendling	cd4c73a	2008-09-22 00:44:35 +0000	[diff] [blame]	3506	getF32Constant(DAG, 0x3e75fe14));
Bill Wendling	e10c814	2008-09-09 22:39:21 +0000	[diff] [blame]	3507	SDValue t10 = DAG.getNode(ISD::FMUL, MVT::f32, t9, X);
				3508	SDValue t11 = DAG.getNode(ISD::FADD, MVT::f32, t10,
Bill Wendling	cd4c73a	2008-09-22 00:44:35 +0000	[diff] [blame]	3509	getF32Constant(DAG, 0x3f317234));
Bill Wendling	e10c814	2008-09-09 22:39:21 +0000	[diff] [blame]	3510	SDValue t12 = DAG.getNode(ISD::FMUL, MVT::f32, t11, X);
				3511	SDValue t13 = DAG.getNode(ISD::FADD, MVT::f32, t12,
Bill Wendling	cd4c73a	2008-09-22 00:44:35 +0000	[diff] [blame]	3512	getF32Constant(DAG, 0x3f800000));
Bill Wendling	e10c814	2008-09-09 22:39:21 +0000	[diff] [blame]	3513	SDValue t14 = DAG.getNode(ISD::BIT_CONVERT, MVT::i32, t13);
				3514	SDValue TwoToFractionalPartOfX =
				3515	DAG.getNode(ISD::ADD, MVT::i32, t14, IntegerPartOfX);
				3516
				3517	result = DAG.getNode(ISD::BIT_CONVERT, MVT::f32, TwoToFractionalPartOfX);
				3518	}
Dale Johannesen	601d3c0	2008-09-05 01:48:15 +0000	[diff] [blame]	3519	} else {
Bill Wendling	3eb5940	2008-09-09 00:28:24 +0000	[diff] [blame]	3520	// No special expansion.
Dale Johannesen	601d3c0	2008-09-05 01:48:15 +0000	[diff] [blame]	3521	result = DAG.getNode(ISD::FEXP2,
				3522	getValue(I.getOperand(1)).getValueType(),
				3523	getValue(I.getOperand(1)));
				3524	}
Bill Wendling	e10c814	2008-09-09 22:39:21 +0000	[diff] [blame]	3525
Dale Johannesen	601d3c0	2008-09-05 01:48:15 +0000	[diff] [blame]	3526	setValue(&I, result);
				3527	}
				3528
Bill Wendling	aeb5c7b	2008-09-10 00:20:20 +0000	[diff] [blame]	3529	/// visitPow - Lower a pow intrinsic. Handles the special sequences for
				3530	/// limited-precision mode with x == 10.0f.
				3531	void
				3532	SelectionDAGLowering::visitPow(CallInst &I) {
				3533	SDValue result;
				3534	Value *Val = I.getOperand(1);
				3535	bool IsExp10 = false;
				3536
				3537	if (getValue(Val).getValueType() == MVT::f32 &&
Bill Wendling	277fc24	2008-09-10 00:24:59 +0000	[diff] [blame]	3538	getValue(I.getOperand(2)).getValueType() == MVT::f32 &&
Bill Wendling	aeb5c7b	2008-09-10 00:20:20 +0000	[diff] [blame]	3539	LimitFloatPrecision > 0 && LimitFloatPrecision <= 18) {
				3540	if (Constant C = const_cast<Constant>(dyn_cast<Constant>(Val))) {
				3541	if (ConstantFP *CFP = dyn_cast<ConstantFP>(C)) {
				3542	APFloat Ten(10.0f);
				3543	IsExp10 = CFP->getValueAPF().bitwiseIsEqual(Ten);
				3544	}
				3545	}
				3546	}
				3547
				3548	if (IsExp10 && LimitFloatPrecision > 0 && LimitFloatPrecision <= 18) {
				3549	SDValue Op = getValue(I.getOperand(2));
				3550
				3551	// Put the exponent in the right bit position for later addition to the
				3552	// final result:
				3553	//
				3554	// #define LOG2OF10 3.3219281f
				3555	// IntegerPartOfX = (int32_t)(x * LOG2OF10);
				3556	SDValue t0 = DAG.getNode(ISD::FMUL, MVT::f32, Op,
Bill Wendling	cd4c73a	2008-09-22 00:44:35 +0000	[diff] [blame]	3557	getF32Constant(DAG, 0x40549a78));
Bill Wendling	aeb5c7b	2008-09-10 00:20:20 +0000	[diff] [blame]	3558	SDValue IntegerPartOfX = DAG.getNode(ISD::FP_TO_SINT, MVT::i32, t0);
				3559
				3560	// FractionalPartOfX = x - (float)IntegerPartOfX;
				3561	SDValue t1 = DAG.getNode(ISD::SINT_TO_FP, MVT::f32, IntegerPartOfX);
				3562	SDValue X = DAG.getNode(ISD::FSUB, MVT::f32, t0, t1);
				3563
				3564	// IntegerPartOfX <<= 23;
				3565	IntegerPartOfX = DAG.getNode(ISD::SHL, MVT::i32, IntegerPartOfX,
				3566	DAG.getConstant(23, MVT::i32));
				3567
				3568	if (LimitFloatPrecision <= 6) {
				3569	// For floating-point precision of 6:
				3570	//
				3571	// twoToFractionalPartOfX =
				3572	// 0.997535578f +
				3573	// (0.735607626f + 0.252464424f * x) * x;
				3574	//
				3575	// error 0.0144103317, which is 6 bits
				3576	SDValue t2 = DAG.getNode(ISD::FMUL, MVT::f32, X,
Bill Wendling	cd4c73a	2008-09-22 00:44:35 +0000	[diff] [blame]	3577	getF32Constant(DAG, 0x3e814304));
Bill Wendling	aeb5c7b	2008-09-10 00:20:20 +0000	[diff] [blame]	3578	SDValue t3 = DAG.getNode(ISD::FADD, MVT::f32, t2,
Bill Wendling	cd4c73a	2008-09-22 00:44:35 +0000	[diff] [blame]	3579	getF32Constant(DAG, 0x3f3c50c8));
Bill Wendling	aeb5c7b	2008-09-10 00:20:20 +0000	[diff] [blame]	3580	SDValue t4 = DAG.getNode(ISD::FMUL, MVT::f32, t3, X);
				3581	SDValue t5 = DAG.getNode(ISD::FADD, MVT::f32, t4,
Bill Wendling	cd4c73a	2008-09-22 00:44:35 +0000	[diff] [blame]	3582	getF32Constant(DAG, 0x3f7f5e7e));
Bill Wendling	aeb5c7b	2008-09-10 00:20:20 +0000	[diff] [blame]	3583	SDValue t6 = DAG.getNode(ISD::BIT_CONVERT, MVT::i32, t5);
				3584	SDValue TwoToFractionalPartOfX =
				3585	DAG.getNode(ISD::ADD, MVT::i32, t6, IntegerPartOfX);
				3586
				3587	result = DAG.getNode(ISD::BIT_CONVERT, MVT::f32, TwoToFractionalPartOfX);
				3588	} else if (LimitFloatPrecision > 6 && LimitFloatPrecision <= 12) {
				3589	// For floating-point precision of 12:
				3590	//
				3591	// TwoToFractionalPartOfX =
				3592	// 0.999892986f +
				3593	// (0.696457318f +
				3594	// (0.224338339f + 0.792043434e-1f * x) * x) * x;
				3595	//
				3596	// error 0.000107046256, which is 13 to 14 bits
				3597	SDValue t2 = DAG.getNode(ISD::FMUL, MVT::f32, X,
Bill Wendling	cd4c73a	2008-09-22 00:44:35 +0000	[diff] [blame]	3598	getF32Constant(DAG, 0x3da235e3));
Bill Wendling	aeb5c7b	2008-09-10 00:20:20 +0000	[diff] [blame]	3599	SDValue t3 = DAG.getNode(ISD::FADD, MVT::f32, t2,
Bill Wendling	cd4c73a	2008-09-22 00:44:35 +0000	[diff] [blame]	3600	getF32Constant(DAG, 0x3e65b8f3));
Bill Wendling	aeb5c7b	2008-09-10 00:20:20 +0000	[diff] [blame]	3601	SDValue t4 = DAG.getNode(ISD::FMUL, MVT::f32, t3, X);
				3602	SDValue t5 = DAG.getNode(ISD::FADD, MVT::f32, t4,
Bill Wendling	cd4c73a	2008-09-22 00:44:35 +0000	[diff] [blame]	3603	getF32Constant(DAG, 0x3f324b07));
Bill Wendling	aeb5c7b	2008-09-10 00:20:20 +0000	[diff] [blame]	3604	SDValue t6 = DAG.getNode(ISD::FMUL, MVT::f32, t5, X);
				3605	SDValue t7 = DAG.getNode(ISD::FADD, MVT::f32, t6,
Bill Wendling	cd4c73a	2008-09-22 00:44:35 +0000	[diff] [blame]	3606	getF32Constant(DAG, 0x3f7ff8fd));
Bill Wendling	aeb5c7b	2008-09-10 00:20:20 +0000	[diff] [blame]	3607	SDValue t8 = DAG.getNode(ISD::BIT_CONVERT, MVT::i32, t7);
				3608	SDValue TwoToFractionalPartOfX =
				3609	DAG.getNode(ISD::ADD, MVT::i32, t8, IntegerPartOfX);
				3610
				3611	result = DAG.getNode(ISD::BIT_CONVERT, MVT::f32, TwoToFractionalPartOfX);
				3612	} else { // LimitFloatPrecision > 12 && LimitFloatPrecision <= 18
				3613	// For floating-point precision of 18:
				3614	//
				3615	// TwoToFractionalPartOfX =
				3616	// 0.999999982f +
				3617	// (0.693148872f +
				3618	// (0.240227044f +
				3619	// (0.554906021e-1f +
				3620	// (0.961591928e-2f +
				3621	// (0.136028312e-2f + 0.157059148e-3f x)x)x)x)x)x;
				3622	// error 2.47208000*10^(-7), which is better than 18 bits
				3623	SDValue t2 = DAG.getNode(ISD::FMUL, MVT::f32, X,
Bill Wendling	cd4c73a	2008-09-22 00:44:35 +0000	[diff] [blame]	3624	getF32Constant(DAG, 0x3924b03e));
Bill Wendling	aeb5c7b	2008-09-10 00:20:20 +0000	[diff] [blame]	3625	SDValue t3 = DAG.getNode(ISD::FADD, MVT::f32, t2,
Bill Wendling	cd4c73a	2008-09-22 00:44:35 +0000	[diff] [blame]	3626	getF32Constant(DAG, 0x3ab24b87));
Bill Wendling	aeb5c7b	2008-09-10 00:20:20 +0000	[diff] [blame]	3627	SDValue t4 = DAG.getNode(ISD::FMUL, MVT::f32, t3, X);
				3628	SDValue t5 = DAG.getNode(ISD::FADD, MVT::f32, t4,
Bill Wendling	cd4c73a	2008-09-22 00:44:35 +0000	[diff] [blame]	3629	getF32Constant(DAG, 0x3c1d8c17));
Bill Wendling	aeb5c7b	2008-09-10 00:20:20 +0000	[diff] [blame]	3630	SDValue t6 = DAG.getNode(ISD::FMUL, MVT::f32, t5, X);
				3631	SDValue t7 = DAG.getNode(ISD::FADD, MVT::f32, t6,
Bill Wendling	cd4c73a	2008-09-22 00:44:35 +0000	[diff] [blame]	3632	getF32Constant(DAG, 0x3d634a1d));
Bill Wendling	aeb5c7b	2008-09-10 00:20:20 +0000	[diff] [blame]	3633	SDValue t8 = DAG.getNode(ISD::FMUL, MVT::f32, t7, X);
				3634	SDValue t9 = DAG.getNode(ISD::FADD, MVT::f32, t8,
Bill Wendling	cd4c73a	2008-09-22 00:44:35 +0000	[diff] [blame]	3635	getF32Constant(DAG, 0x3e75fe14));
Bill Wendling	aeb5c7b	2008-09-10 00:20:20 +0000	[diff] [blame]	3636	SDValue t10 = DAG.getNode(ISD::FMUL, MVT::f32, t9, X);
				3637	SDValue t11 = DAG.getNode(ISD::FADD, MVT::f32, t10,
Bill Wendling	cd4c73a	2008-09-22 00:44:35 +0000	[diff] [blame]	3638	getF32Constant(DAG, 0x3f317234));
Bill Wendling	aeb5c7b	2008-09-10 00:20:20 +0000	[diff] [blame]	3639	SDValue t12 = DAG.getNode(ISD::FMUL, MVT::f32, t11, X);
				3640	SDValue t13 = DAG.getNode(ISD::FADD, MVT::f32, t12,
Bill Wendling	cd4c73a	2008-09-22 00:44:35 +0000	[diff] [blame]	3641	getF32Constant(DAG, 0x3f800000));
Bill Wendling	aeb5c7b	2008-09-10 00:20:20 +0000	[diff] [blame]	3642	SDValue t14 = DAG.getNode(ISD::BIT_CONVERT, MVT::i32, t13);
				3643	SDValue TwoToFractionalPartOfX =
				3644	DAG.getNode(ISD::ADD, MVT::i32, t14, IntegerPartOfX);
				3645
				3646	result = DAG.getNode(ISD::BIT_CONVERT, MVT::f32, TwoToFractionalPartOfX);
				3647	}
				3648	} else {
				3649	// No special expansion.
				3650	result = DAG.getNode(ISD::FPOW,
				3651	getValue(I.getOperand(1)).getValueType(),
				3652	getValue(I.getOperand(1)),
				3653	getValue(I.getOperand(2)));
				3654	}
				3655
				3656	setValue(&I, result);
				3657	}
				3658
Dan Gohman	f0cbcd4	2008-09-03 16:12:24 +0000	[diff] [blame]	3659	/// visitIntrinsicCall - Lower the call to the specified intrinsic function. If
				3660	/// we want to emit this as a call to a named external function, return the name
				3661	/// otherwise lower it and return null.
				3662	const char *
				3663	SelectionDAGLowering::visitIntrinsicCall(CallInst &I, unsigned Intrinsic) {
				3664	switch (Intrinsic) {
				3665	default:
				3666	// By default, turn this into a target intrinsic node.
				3667	visitTargetIntrinsic(I, Intrinsic);
				3668	return 0;
				3669	case Intrinsic::vastart: visitVAStart(I); return 0;
				3670	case Intrinsic::vaend: visitVAEnd(I); return 0;
				3671	case Intrinsic::vacopy: visitVACopy(I); return 0;
				3672	case Intrinsic::returnaddress:
				3673	setValue(&I, DAG.getNode(ISD::RETURNADDR, TLI.getPointerTy(),
				3674	getValue(I.getOperand(1))));
				3675	return 0;
Bill Wendling	d5d8191	2008-09-26 22:10:44 +0000	[diff] [blame]	3676	case Intrinsic::frameaddress:
Dan Gohman	f0cbcd4	2008-09-03 16:12:24 +0000	[diff] [blame]	3677	setValue(&I, DAG.getNode(ISD::FRAMEADDR, TLI.getPointerTy(),
				3678	getValue(I.getOperand(1))));
				3679	return 0;
				3680	case Intrinsic::setjmp:
				3681	return "_setjmp"+!TLI.usesUnderscoreSetJmp();
				3682	break;
				3683	case Intrinsic::longjmp:
				3684	return "_longjmp"+!TLI.usesUnderscoreLongJmp();
				3685	break;
Chris Lattner	824b958	2008-11-21 16:42:48 +0000	[diff] [blame]	3686	case Intrinsic::memcpy: {
Dan Gohman	f0cbcd4	2008-09-03 16:12:24 +0000	[diff] [blame]	3687	SDValue Op1 = getValue(I.getOperand(1));
				3688	SDValue Op2 = getValue(I.getOperand(2));
				3689	SDValue Op3 = getValue(I.getOperand(3));
				3690	unsigned Align = cast<ConstantInt>(I.getOperand(4))->getZExtValue();
				3691	DAG.setRoot(DAG.getMemcpy(getRoot(), Op1, Op2, Op3, Align, false,
				3692	I.getOperand(1), 0, I.getOperand(2), 0));
				3693	return 0;
				3694	}
Chris Lattner	824b958	2008-11-21 16:42:48 +0000	[diff] [blame]	3695	case Intrinsic::memset: {
Dan Gohman	f0cbcd4	2008-09-03 16:12:24 +0000	[diff] [blame]	3696	SDValue Op1 = getValue(I.getOperand(1));
				3697	SDValue Op2 = getValue(I.getOperand(2));
				3698	SDValue Op3 = getValue(I.getOperand(3));
				3699	unsigned Align = cast<ConstantInt>(I.getOperand(4))->getZExtValue();
				3700	DAG.setRoot(DAG.getMemset(getRoot(), Op1, Op2, Op3, Align,
				3701	I.getOperand(1), 0));
				3702	return 0;
				3703	}
Chris Lattner	824b958	2008-11-21 16:42:48 +0000	[diff] [blame]	3704	case Intrinsic::memmove: {
Dan Gohman	f0cbcd4	2008-09-03 16:12:24 +0000	[diff] [blame]	3705	SDValue Op1 = getValue(I.getOperand(1));
				3706	SDValue Op2 = getValue(I.getOperand(2));
				3707	SDValue Op3 = getValue(I.getOperand(3));
				3708	unsigned Align = cast<ConstantInt>(I.getOperand(4))->getZExtValue();
				3709
				3710	// If the source and destination are known to not be aliases, we can
				3711	// lower memmove as memcpy.
				3712	uint64_t Size = -1ULL;
				3713	if (ConstantSDNode *C = dyn_cast<ConstantSDNode>(Op3))
Dan Gohman	f5aeb1a	2008-09-12 16:56:44 +0000	[diff] [blame]	3714	Size = C->getZExtValue();
Dan Gohman	f0cbcd4	2008-09-03 16:12:24 +0000	[diff] [blame]	3715	if (AA->alias(I.getOperand(1), Size, I.getOperand(2), Size) ==
				3716	AliasAnalysis::NoAlias) {
				3717	DAG.setRoot(DAG.getMemcpy(getRoot(), Op1, Op2, Op3, Align, false,
				3718	I.getOperand(1), 0, I.getOperand(2), 0));
				3719	return 0;
				3720	}
				3721
				3722	DAG.setRoot(DAG.getMemmove(getRoot(), Op1, Op2, Op3, Align,
				3723	I.getOperand(1), 0, I.getOperand(2), 0));
				3724	return 0;
				3725	}
				3726	case Intrinsic::dbg_stoppoint: {
				3727	MachineModuleInfo *MMI = DAG.getMachineModuleInfo();
				3728	DbgStopPointInst &SPI = cast<DbgStopPointInst>(I);
				3729	if (MMI && SPI.getContext() && MMI->Verify(SPI.getContext())) {
				3730	DebugInfoDesc *DD = MMI->getDescFor(SPI.getContext());
				3731	assert(DD && "Not a debug information descriptor");
				3732	DAG.setRoot(DAG.getDbgStopPoint(getRoot(),
				3733	SPI.getLine(),
				3734	SPI.getColumn(),
				3735	cast<CompileUnitDesc>(DD)));
				3736	}
				3737
				3738	return 0;
				3739	}
				3740	case Intrinsic::dbg_region_start: {
				3741	MachineModuleInfo *MMI = DAG.getMachineModuleInfo();
				3742	DbgRegionStartInst &RSI = cast<DbgRegionStartInst>(I);
				3743	if (MMI && RSI.getContext() && MMI->Verify(RSI.getContext())) {
				3744	unsigned LabelID = MMI->RecordRegionStart(RSI.getContext());
				3745	DAG.setRoot(DAG.getLabel(ISD::DBG_LABEL, getRoot(), LabelID));
				3746	}
				3747
				3748	return 0;
				3749	}
				3750	case Intrinsic::dbg_region_end: {
				3751	MachineModuleInfo *MMI = DAG.getMachineModuleInfo();
				3752	DbgRegionEndInst &REI = cast<DbgRegionEndInst>(I);
				3753	if (MMI && REI.getContext() && MMI->Verify(REI.getContext())) {
				3754	unsigned LabelID = MMI->RecordRegionEnd(REI.getContext());
				3755	DAG.setRoot(DAG.getLabel(ISD::DBG_LABEL, getRoot(), LabelID));
				3756	}
				3757
				3758	return 0;
				3759	}
				3760	case Intrinsic::dbg_func_start: {
				3761	MachineModuleInfo *MMI = DAG.getMachineModuleInfo();
				3762	if (!MMI) return 0;
				3763	DbgFuncStartInst &FSI = cast<DbgFuncStartInst>(I);
				3764	Value *SP = FSI.getSubprogram();
				3765	if (SP && MMI->Verify(SP)) {
				3766	// llvm.dbg.func.start implicitly defines a dbg_stoppoint which is
				3767	// what (most?) gdb expects.
				3768	DebugInfoDesc *DD = MMI->getDescFor(SP);
				3769	assert(DD && "Not a debug information descriptor");
				3770	SubprogramDesc *Subprogram = cast<SubprogramDesc>(DD);
				3771	const CompileUnitDesc *CompileUnit = Subprogram->getFile();
				3772	unsigned SrcFile = MMI->RecordSource(CompileUnit);
Devang Patel	20dd046	2008-11-06 00:30:09 +0000	[diff] [blame]	3773	// Record the source line but does not create a label for the normal
				3774	// function start. It will be emitted at asm emission time. However,
				3775	// create a label if this is a beginning of inlined function.
				3776	unsigned LabelID = MMI->RecordSourceLine(Subprogram->getLine(), 0, SrcFile);
				3777	if (MMI->getSourceLines().size() != 1)
				3778	DAG.setRoot(DAG.getLabel(ISD::DBG_LABEL, getRoot(), LabelID));
Dan Gohman	f0cbcd4	2008-09-03 16:12:24 +0000	[diff] [blame]	3779	}
				3780
				3781	return 0;
				3782	}
				3783	case Intrinsic::dbg_declare: {
				3784	MachineModuleInfo *MMI = DAG.getMachineModuleInfo();
				3785	DbgDeclareInst &DI = cast<DbgDeclareInst>(I);
				3786	Value *Variable = DI.getVariable();
				3787	if (MMI && Variable && MMI->Verify(Variable))
				3788	DAG.setRoot(DAG.getNode(ISD::DECLARE, MVT::Other, getRoot(),
				3789	getValue(DI.getAddress()), getValue(Variable)));
				3790	return 0;
				3791	}
				3792
				3793	case Intrinsic::eh_exception: {
				3794	if (!CurMBB->isLandingPad()) {
				3795	// FIXME: Mark exception register as live in. Hack for PR1508.
				3796	unsigned Reg = TLI.getExceptionAddressRegister();
				3797	if (Reg) CurMBB->addLiveIn(Reg);
				3798	}
				3799	// Insert the EXCEPTIONADDR instruction.
				3800	SDVTList VTs = DAG.getVTList(TLI.getPointerTy(), MVT::Other);
				3801	SDValue Ops[1];
				3802	Ops[0] = DAG.getRoot();
				3803	SDValue Op = DAG.getNode(ISD::EXCEPTIONADDR, VTs, Ops, 1);
				3804	setValue(&I, Op);
				3805	DAG.setRoot(Op.getValue(1));
				3806	return 0;
				3807	}
				3808
				3809	case Intrinsic::eh_selector_i32:
				3810	case Intrinsic::eh_selector_i64: {
				3811	MachineModuleInfo *MMI = DAG.getMachineModuleInfo();
				3812	MVT VT = (Intrinsic == Intrinsic::eh_selector_i32 ?
				3813	MVT::i32 : MVT::i64);
				3814
				3815	if (MMI) {
				3816	if (CurMBB->isLandingPad())
				3817	AddCatchInfo(I, MMI, CurMBB);
				3818	else {
				3819	#ifndef NDEBUG
				3820	FuncInfo.CatchInfoLost.insert(&I);
				3821	#endif
				3822	// FIXME: Mark exception selector register as live in. Hack for PR1508.
				3823	unsigned Reg = TLI.getExceptionSelectorRegister();
				3824	if (Reg) CurMBB->addLiveIn(Reg);
				3825	}
				3826
				3827	// Insert the EHSELECTION instruction.
				3828	SDVTList VTs = DAG.getVTList(VT, MVT::Other);
				3829	SDValue Ops[2];
				3830	Ops[0] = getValue(I.getOperand(1));
				3831	Ops[1] = getRoot();
				3832	SDValue Op = DAG.getNode(ISD::EHSELECTION, VTs, Ops, 2);
				3833	setValue(&I, Op);
				3834	DAG.setRoot(Op.getValue(1));
				3835	} else {
				3836	setValue(&I, DAG.getConstant(0, VT));
				3837	}
				3838
				3839	return 0;
				3840	}
				3841
				3842	case Intrinsic::eh_typeid_for_i32:
				3843	case Intrinsic::eh_typeid_for_i64: {
				3844	MachineModuleInfo *MMI = DAG.getMachineModuleInfo();
				3845	MVT VT = (Intrinsic == Intrinsic::eh_typeid_for_i32 ?
				3846	MVT::i32 : MVT::i64);
Anton Korobeynikov	a0e8a1e	2008-09-08 21:13:56 +0000	[diff] [blame]	3847
Dan Gohman	f0cbcd4	2008-09-03 16:12:24 +0000	[diff] [blame]	3848	if (MMI) {
				3849	// Find the type id for the given typeinfo.
				3850	GlobalVariable *GV = ExtractTypeInfo(I.getOperand(1));
				3851
				3852	unsigned TypeID = MMI->getTypeIDFor(GV);
				3853	setValue(&I, DAG.getConstant(TypeID, VT));
				3854	} else {
				3855	// Return something different to eh_selector.
				3856	setValue(&I, DAG.getConstant(1, VT));
				3857	}
				3858
				3859	return 0;
				3860	}
				3861
Anton Korobeynikov	a0e8a1e	2008-09-08 21:13:56 +0000	[diff] [blame]	3862	case Intrinsic::eh_return_i32:
				3863	case Intrinsic::eh_return_i64:
				3864	if (MachineModuleInfo *MMI = DAG.getMachineModuleInfo()) {
Dan Gohman	f0cbcd4	2008-09-03 16:12:24 +0000	[diff] [blame]	3865	MMI->setCallsEHReturn(true);
				3866	DAG.setRoot(DAG.getNode(ISD::EH_RETURN,
				3867	MVT::Other,
				3868	getControlRoot(),
				3869	getValue(I.getOperand(1)),
				3870	getValue(I.getOperand(2))));
				3871	} else {
				3872	setValue(&I, DAG.getConstant(0, TLI.getPointerTy()));
				3873	}
				3874
				3875	return 0;
Anton Korobeynikov	a0e8a1e	2008-09-08 21:13:56 +0000	[diff] [blame]	3876	case Intrinsic::eh_unwind_init:
				3877	if (MachineModuleInfo *MMI = DAG.getMachineModuleInfo()) {
				3878	MMI->setCallsUnwindInit(true);
				3879	}
Dan Gohman	f0cbcd4	2008-09-03 16:12:24 +0000	[diff] [blame]	3880
Anton Korobeynikov	a0e8a1e	2008-09-08 21:13:56 +0000	[diff] [blame]	3881	return 0;
Dan Gohman	f0cbcd4	2008-09-03 16:12:24 +0000	[diff] [blame]	3882
Anton Korobeynikov	a0e8a1e	2008-09-08 21:13:56 +0000	[diff] [blame]	3883	case Intrinsic::eh_dwarf_cfa: {
				3884	MVT VT = getValue(I.getOperand(1)).getValueType();
				3885	SDValue CfaArg;
				3886	if (VT.bitsGT(TLI.getPointerTy()))
				3887	CfaArg = DAG.getNode(ISD::TRUNCATE,
				3888	TLI.getPointerTy(), getValue(I.getOperand(1)));
				3889	else
				3890	CfaArg = DAG.getNode(ISD::SIGN_EXTEND,
				3891	TLI.getPointerTy(), getValue(I.getOperand(1)));
Dan Gohman	f0cbcd4	2008-09-03 16:12:24 +0000	[diff] [blame]	3892
Anton Korobeynikov	a0e8a1e	2008-09-08 21:13:56 +0000	[diff] [blame]	3893	SDValue Offset = DAG.getNode(ISD::ADD,
				3894	TLI.getPointerTy(),
				3895	DAG.getNode(ISD::FRAME_TO_ARGS_OFFSET,
				3896	TLI.getPointerTy()),
				3897	CfaArg);
				3898	setValue(&I, DAG.getNode(ISD::ADD,
				3899	TLI.getPointerTy(),
				3900	DAG.getNode(ISD::FRAMEADDR,
				3901	TLI.getPointerTy(),
				3902	DAG.getConstant(0,
				3903	TLI.getPointerTy())),
				3904	Offset));
				3905	return 0;
Dan Gohman	f0cbcd4	2008-09-03 16:12:24 +0000	[diff] [blame]	3906	}
				3907
Mon P Wang	77cdf30	2008-11-10 20:54:11 +0000	[diff] [blame]	3908	case Intrinsic::convertff:
				3909	case Intrinsic::convertfsi:
				3910	case Intrinsic::convertfui:
				3911	case Intrinsic::convertsif:
				3912	case Intrinsic::convertuif:
				3913	case Intrinsic::convertss:
				3914	case Intrinsic::convertsu:
				3915	case Intrinsic::convertus:
				3916	case Intrinsic::convertuu: {
				3917	ISD::CvtCode Code = ISD::CVT_INVALID;
				3918	switch (Intrinsic) {
				3919	case Intrinsic::convertff: Code = ISD::CVT_FF; break;
				3920	case Intrinsic::convertfsi: Code = ISD::CVT_FS; break;
				3921	case Intrinsic::convertfui: Code = ISD::CVT_FU; break;
				3922	case Intrinsic::convertsif: Code = ISD::CVT_SF; break;
				3923	case Intrinsic::convertuif: Code = ISD::CVT_UF; break;
				3924	case Intrinsic::convertss: Code = ISD::CVT_SS; break;
				3925	case Intrinsic::convertsu: Code = ISD::CVT_SU; break;
				3926	case Intrinsic::convertus: Code = ISD::CVT_US; break;
				3927	case Intrinsic::convertuu: Code = ISD::CVT_UU; break;
				3928	}
				3929	MVT DestVT = TLI.getValueType(I.getType());
				3930	Value* Op1 = I.getOperand(1);
				3931	setValue(&I, DAG.getConvertRndSat(DestVT, getValue(Op1),
				3932	DAG.getValueType(DestVT),
				3933	DAG.getValueType(getValue(Op1).getValueType()),
				3934	getValue(I.getOperand(2)),
				3935	getValue(I.getOperand(3)),
				3936	Code));
				3937	return 0;
				3938	}
				3939
Dan Gohman	f0cbcd4	2008-09-03 16:12:24 +0000	[diff] [blame]	3940	case Intrinsic::sqrt:
				3941	setValue(&I, DAG.getNode(ISD::FSQRT,
				3942	getValue(I.getOperand(1)).getValueType(),
				3943	getValue(I.getOperand(1))));
				3944	return 0;
				3945	case Intrinsic::powi:
				3946	setValue(&I, DAG.getNode(ISD::FPOWI,
				3947	getValue(I.getOperand(1)).getValueType(),
				3948	getValue(I.getOperand(1)),
				3949	getValue(I.getOperand(2))));
				3950	return 0;
				3951	case Intrinsic::sin:
				3952	setValue(&I, DAG.getNode(ISD::FSIN,
				3953	getValue(I.getOperand(1)).getValueType(),
				3954	getValue(I.getOperand(1))));
				3955	return 0;
				3956	case Intrinsic::cos:
				3957	setValue(&I, DAG.getNode(ISD::FCOS,
				3958	getValue(I.getOperand(1)).getValueType(),
				3959	getValue(I.getOperand(1))));
				3960	return 0;
Dale Johannesen	7794f2a	2008-09-04 00:47:13 +0000	[diff] [blame]	3961	case Intrinsic::log:
Dale Johannesen	59e577f	2008-09-05 18:38:42 +0000	[diff] [blame]	3962	visitLog(I);
Dale Johannesen	7794f2a	2008-09-04 00:47:13 +0000	[diff] [blame]	3963	return 0;
				3964	case Intrinsic::log2:
Dale Johannesen	59e577f	2008-09-05 18:38:42 +0000	[diff] [blame]	3965	visitLog2(I);
Dale Johannesen	7794f2a	2008-09-04 00:47:13 +0000	[diff] [blame]	3966	return 0;
				3967	case Intrinsic::log10:
Dale Johannesen	59e577f	2008-09-05 18:38:42 +0000	[diff] [blame]	3968	visitLog10(I);
Dale Johannesen	7794f2a	2008-09-04 00:47:13 +0000	[diff] [blame]	3969	return 0;
				3970	case Intrinsic::exp:
Dale Johannesen	59e577f	2008-09-05 18:38:42 +0000	[diff] [blame]	3971	visitExp(I);
Dale Johannesen	7794f2a	2008-09-04 00:47:13 +0000	[diff] [blame]	3972	return 0;
				3973	case Intrinsic::exp2:
Dale Johannesen	601d3c0	2008-09-05 01:48:15 +0000	[diff] [blame]	3974	visitExp2(I);
Dale Johannesen	7794f2a	2008-09-04 00:47:13 +0000	[diff] [blame]	3975	return 0;
Dan Gohman	f0cbcd4	2008-09-03 16:12:24 +0000	[diff] [blame]	3976	case Intrinsic::pow:
Bill Wendling	aeb5c7b	2008-09-10 00:20:20 +0000	[diff] [blame]	3977	visitPow(I);
Dan Gohman	f0cbcd4	2008-09-03 16:12:24 +0000	[diff] [blame]	3978	return 0;
				3979	case Intrinsic::pcmarker: {
				3980	SDValue Tmp = getValue(I.getOperand(1));
				3981	DAG.setRoot(DAG.getNode(ISD::PCMARKER, MVT::Other, getRoot(), Tmp));
				3982	return 0;
				3983	}
				3984	case Intrinsic::readcyclecounter: {
				3985	SDValue Op = getRoot();
				3986	SDValue Tmp = DAG.getNode(ISD::READCYCLECOUNTER,
				3987	DAG.getNodeValueTypes(MVT::i64, MVT::Other), 2,
				3988	&Op, 1);
				3989	setValue(&I, Tmp);
				3990	DAG.setRoot(Tmp.getValue(1));
				3991	return 0;
				3992	}
				3993	case Intrinsic::part_select: {
				3994	// Currently not implemented: just abort
				3995	assert(0 && "part_select intrinsic not implemented");
				3996	abort();
				3997	}
				3998	case Intrinsic::part_set: {
				3999	// Currently not implemented: just abort
				4000	assert(0 && "part_set intrinsic not implemented");
				4001	abort();
				4002	}
				4003	case Intrinsic::bswap:
				4004	setValue(&I, DAG.getNode(ISD::BSWAP,
				4005	getValue(I.getOperand(1)).getValueType(),
				4006	getValue(I.getOperand(1))));
				4007	return 0;
				4008	case Intrinsic::cttz: {
				4009	SDValue Arg = getValue(I.getOperand(1));
				4010	MVT Ty = Arg.getValueType();
				4011	SDValue result = DAG.getNode(ISD::CTTZ, Ty, Arg);
				4012	setValue(&I, result);
				4013	return 0;
				4014	}
				4015	case Intrinsic::ctlz: {
				4016	SDValue Arg = getValue(I.getOperand(1));
				4017	MVT Ty = Arg.getValueType();
				4018	SDValue result = DAG.getNode(ISD::CTLZ, Ty, Arg);
				4019	setValue(&I, result);
				4020	return 0;
				4021	}
				4022	case Intrinsic::ctpop: {
				4023	SDValue Arg = getValue(I.getOperand(1));
				4024	MVT Ty = Arg.getValueType();
				4025	SDValue result = DAG.getNode(ISD::CTPOP, Ty, Arg);
				4026	setValue(&I, result);
				4027	return 0;
				4028	}
				4029	case Intrinsic::stacksave: {
				4030	SDValue Op = getRoot();
				4031	SDValue Tmp = DAG.getNode(ISD::STACKSAVE,
				4032	DAG.getNodeValueTypes(TLI.getPointerTy(), MVT::Other), 2, &Op, 1);
				4033	setValue(&I, Tmp);
				4034	DAG.setRoot(Tmp.getValue(1));
				4035	return 0;
				4036	}
				4037	case Intrinsic::stackrestore: {
				4038	SDValue Tmp = getValue(I.getOperand(1));
				4039	DAG.setRoot(DAG.getNode(ISD::STACKRESTORE, MVT::Other, getRoot(), Tmp));
				4040	return 0;
				4041	}
Bill Wendling	5734450	2008-11-18 11:01:33 +0000	[diff] [blame]	4042	case Intrinsic::stackprotector: {
Bill Wendling	b2a4298	2008-11-06 02:29:10 +0000	[diff] [blame]	4043	// Emit code into the DAG to store the stack guard onto the stack.
				4044	MachineFunction &MF = DAG.getMachineFunction();
				4045	MachineFrameInfo *MFI = MF.getFrameInfo();
				4046	MVT PtrTy = TLI.getPointerTy();
				4047
Bill Wendling	b7c6ebc	2008-11-07 01:23:58 +0000	[diff] [blame]	4048	SDValue Src = getValue(I.getOperand(1)); // The guard's value.
				4049	AllocaInst *Slot = cast<AllocaInst>(I.getOperand(2));
Bill Wendling	b2a4298	2008-11-06 02:29:10 +0000	[diff] [blame]	4050
Bill Wendling	b7c6ebc	2008-11-07 01:23:58 +0000	[diff] [blame]	4051	int FI = FuncInfo.StaticAllocaMap[Slot];
Bill Wendling	b2a4298	2008-11-06 02:29:10 +0000	[diff] [blame]	4052	MFI->setStackProtectorIndex(FI);
				4053
				4054	SDValue FIN = DAG.getFrameIndex(FI, PtrTy);
				4055
				4056	// Store the stack protector onto the stack.
				4057	SDValue Result = DAG.getStore(getRoot(), Src, FIN,
				4058	PseudoSourceValue::getFixedStack(FI),
				4059	0, true);
				4060	setValue(&I, Result);
				4061	DAG.setRoot(Result);
				4062	return 0;
				4063	}
Dan Gohman	f0cbcd4	2008-09-03 16:12:24 +0000	[diff] [blame]	4064	case Intrinsic::var_annotation:
				4065	// Discard annotate attributes
				4066	return 0;
				4067
				4068	case Intrinsic::init_trampoline: {
				4069	const Function *F = cast<Function>(I.getOperand(2)->stripPointerCasts());
				4070
				4071	SDValue Ops[6];
				4072	Ops[0] = getRoot();
				4073	Ops[1] = getValue(I.getOperand(1));
				4074	Ops[2] = getValue(I.getOperand(2));
				4075	Ops[3] = getValue(I.getOperand(3));
				4076	Ops[4] = DAG.getSrcValue(I.getOperand(1));
				4077	Ops[5] = DAG.getSrcValue(F);
				4078
				4079	SDValue Tmp = DAG.getNode(ISD::TRAMPOLINE,
				4080	DAG.getNodeValueTypes(TLI.getPointerTy(),
				4081	MVT::Other), 2,
				4082	Ops, 6);
				4083
				4084	setValue(&I, Tmp);
				4085	DAG.setRoot(Tmp.getValue(1));
				4086	return 0;
				4087	}
				4088
				4089	case Intrinsic::gcroot:
				4090	if (GFI) {
				4091	Value *Alloca = I.getOperand(1);
				4092	Constant *TypeMap = cast<Constant>(I.getOperand(2));
				4093
				4094	FrameIndexSDNode *FI = cast<FrameIndexSDNode>(getValue(Alloca).getNode());
				4095	GFI->addStackRoot(FI->getIndex(), TypeMap);
				4096	}
				4097	return 0;
				4098
				4099	case Intrinsic::gcread:
				4100	case Intrinsic::gcwrite:
				4101	assert(0 && "GC failed to lower gcread/gcwrite intrinsics!");
				4102	return 0;
				4103
				4104	case Intrinsic::flt_rounds: {
				4105	setValue(&I, DAG.getNode(ISD::FLT_ROUNDS_, MVT::i32));
				4106	return 0;
				4107	}
				4108
				4109	case Intrinsic::trap: {
				4110	DAG.setRoot(DAG.getNode(ISD::TRAP, MVT::Other, getRoot()));
				4111	return 0;
				4112	}
Bill Wendling	7cdc3c8	2008-11-21 02:03:52 +0000	[diff] [blame]	4113
Bill Wendling	ef37546	2008-11-21 02:38:44 +0000	[diff] [blame]	4114	case Intrinsic::uadd_with_overflow:
Bill Wendling	74c3765	2008-12-09 22:08:41 +0000	[diff] [blame]	4115	return implVisitAluOverflow(I, ISD::UADDO);
				4116	case Intrinsic::sadd_with_overflow:
				4117	return implVisitAluOverflow(I, ISD::SADDO);
				4118	case Intrinsic::usub_with_overflow:
				4119	return implVisitAluOverflow(I, ISD::USUBO);
				4120	case Intrinsic::ssub_with_overflow:
				4121	return implVisitAluOverflow(I, ISD::SSUBO);
				4122	case Intrinsic::umul_with_overflow:
				4123	return implVisitAluOverflow(I, ISD::UMULO);
				4124	case Intrinsic::smul_with_overflow:
				4125	return implVisitAluOverflow(I, ISD::SMULO);
Bill Wendling	7cdc3c8	2008-11-21 02:03:52 +0000	[diff] [blame]	4126
Dan Gohman	f0cbcd4	2008-09-03 16:12:24 +0000	[diff] [blame]	4127	case Intrinsic::prefetch: {
				4128	SDValue Ops[4];
				4129	Ops[0] = getRoot();
				4130	Ops[1] = getValue(I.getOperand(1));
				4131	Ops[2] = getValue(I.getOperand(2));
				4132	Ops[3] = getValue(I.getOperand(3));
				4133	DAG.setRoot(DAG.getNode(ISD::PREFETCH, MVT::Other, &Ops[0], 4));
				4134	return 0;
				4135	}
				4136
				4137	case Intrinsic::memory_barrier: {
				4138	SDValue Ops[6];
				4139	Ops[0] = getRoot();
				4140	for (int x = 1; x < 6; ++x)
				4141	Ops[x] = getValue(I.getOperand(x));
				4142
				4143	DAG.setRoot(DAG.getNode(ISD::MEMBARRIER, MVT::Other, &Ops[0], 6));
				4144	return 0;
				4145	}
				4146	case Intrinsic::atomic_cmp_swap: {
				4147	SDValue Root = getRoot();
				4148	SDValue L;
				4149	switch (getValue(I.getOperand(2)).getValueType().getSimpleVT()) {
				4150	case MVT::i8:
				4151	L = DAG.getAtomic(ISD::ATOMIC_CMP_SWAP_8, Root,
				4152	getValue(I.getOperand(1)),
				4153	getValue(I.getOperand(2)),
				4154	getValue(I.getOperand(3)),
				4155	I.getOperand(1));
				4156	break;
				4157	case MVT::i16:
				4158	L = DAG.getAtomic(ISD::ATOMIC_CMP_SWAP_16, Root,
				4159	getValue(I.getOperand(1)),
				4160	getValue(I.getOperand(2)),
				4161	getValue(I.getOperand(3)),
				4162	I.getOperand(1));
				4163	break;
				4164	case MVT::i32:
				4165	L = DAG.getAtomic(ISD::ATOMIC_CMP_SWAP_32, Root,
				4166	getValue(I.getOperand(1)),
				4167	getValue(I.getOperand(2)),
				4168	getValue(I.getOperand(3)),
				4169	I.getOperand(1));
				4170	break;
				4171	case MVT::i64:
				4172	L = DAG.getAtomic(ISD::ATOMIC_CMP_SWAP_64, Root,
				4173	getValue(I.getOperand(1)),
				4174	getValue(I.getOperand(2)),
				4175	getValue(I.getOperand(3)),
				4176	I.getOperand(1));
				4177	break;
				4178	default:
				4179	assert(0 && "Invalid atomic type");
				4180	abort();
				4181	}
				4182	setValue(&I, L);
				4183	DAG.setRoot(L.getValue(1));
				4184	return 0;
				4185	}
				4186	case Intrinsic::atomic_load_add:
				4187	switch (getValue(I.getOperand(2)).getValueType().getSimpleVT()) {
				4188	case MVT::i8:
				4189	return implVisitBinaryAtomic(I, ISD::ATOMIC_LOAD_ADD_8);
				4190	case MVT::i16:
				4191	return implVisitBinaryAtomic(I, ISD::ATOMIC_LOAD_ADD_16);
				4192	case MVT::i32:
				4193	return implVisitBinaryAtomic(I, ISD::ATOMIC_LOAD_ADD_32);
				4194	case MVT::i64:
				4195	return implVisitBinaryAtomic(I, ISD::ATOMIC_LOAD_ADD_64);
				4196	default:
				4197	assert(0 && "Invalid atomic type");
				4198	abort();
				4199	}
				4200	case Intrinsic::atomic_load_sub:
				4201	switch (getValue(I.getOperand(2)).getValueType().getSimpleVT()) {
				4202	case MVT::i8:
				4203	return implVisitBinaryAtomic(I, ISD::ATOMIC_LOAD_SUB_8);
				4204	case MVT::i16:
				4205	return implVisitBinaryAtomic(I, ISD::ATOMIC_LOAD_SUB_16);
				4206	case MVT::i32:
				4207	return implVisitBinaryAtomic(I, ISD::ATOMIC_LOAD_SUB_32);
				4208	case MVT::i64:
				4209	return implVisitBinaryAtomic(I, ISD::ATOMIC_LOAD_SUB_64);
				4210	default:
				4211	assert(0 && "Invalid atomic type");
				4212	abort();
				4213	}
				4214	case Intrinsic::atomic_load_or:
				4215	switch (getValue(I.getOperand(2)).getValueType().getSimpleVT()) {
				4216	case MVT::i8:
				4217	return implVisitBinaryAtomic(I, ISD::ATOMIC_LOAD_OR_8);
				4218	case MVT::i16:
				4219	return implVisitBinaryAtomic(I, ISD::ATOMIC_LOAD_OR_16);
				4220	case MVT::i32:
				4221	return implVisitBinaryAtomic(I, ISD::ATOMIC_LOAD_OR_32);
				4222	case MVT::i64:
				4223	return implVisitBinaryAtomic(I, ISD::ATOMIC_LOAD_OR_64);
				4224	default:
				4225	assert(0 && "Invalid atomic type");
				4226	abort();
				4227	}
				4228	case Intrinsic::atomic_load_xor:
				4229	switch (getValue(I.getOperand(2)).getValueType().getSimpleVT()) {
				4230	case MVT::i8:
				4231	return implVisitBinaryAtomic(I, ISD::ATOMIC_LOAD_XOR_8);
				4232	case MVT::i16:
				4233	return implVisitBinaryAtomic(I, ISD::ATOMIC_LOAD_XOR_16);
				4234	case MVT::i32:
				4235	return implVisitBinaryAtomic(I, ISD::ATOMIC_LOAD_XOR_32);
				4236	case MVT::i64:
				4237	return implVisitBinaryAtomic(I, ISD::ATOMIC_LOAD_XOR_64);
				4238	default:
				4239	assert(0 && "Invalid atomic type");
				4240	abort();
				4241	}
				4242	case Intrinsic::atomic_load_and:
				4243	switch (getValue(I.getOperand(2)).getValueType().getSimpleVT()) {
				4244	case MVT::i8:
				4245	return implVisitBinaryAtomic(I, ISD::ATOMIC_LOAD_AND_8);
				4246	case MVT::i16:
				4247	return implVisitBinaryAtomic(I, ISD::ATOMIC_LOAD_AND_16);
				4248	case MVT::i32:
				4249	return implVisitBinaryAtomic(I, ISD::ATOMIC_LOAD_AND_32);
				4250	case MVT::i64:
				4251	return implVisitBinaryAtomic(I, ISD::ATOMIC_LOAD_AND_64);
				4252	default:
				4253	assert(0 && "Invalid atomic type");
				4254	abort();
				4255	}
				4256	case Intrinsic::atomic_load_nand:
				4257	switch (getValue(I.getOperand(2)).getValueType().getSimpleVT()) {
				4258	case MVT::i8:
				4259	return implVisitBinaryAtomic(I, ISD::ATOMIC_LOAD_NAND_8);
				4260	case MVT::i16:
				4261	return implVisitBinaryAtomic(I, ISD::ATOMIC_LOAD_NAND_16);
				4262	case MVT::i32:
				4263	return implVisitBinaryAtomic(I, ISD::ATOMIC_LOAD_NAND_32);
				4264	case MVT::i64:
				4265	return implVisitBinaryAtomic(I, ISD::ATOMIC_LOAD_NAND_64);
				4266	default:
				4267	assert(0 && "Invalid atomic type");
				4268	abort();
				4269	}
				4270	case Intrinsic::atomic_load_max:
				4271	switch (getValue(I.getOperand(2)).getValueType().getSimpleVT()) {
				4272	case MVT::i8:
				4273	return implVisitBinaryAtomic(I, ISD::ATOMIC_LOAD_MAX_8);
				4274	case MVT::i16:
				4275	return implVisitBinaryAtomic(I, ISD::ATOMIC_LOAD_MAX_16);
				4276	case MVT::i32:
				4277	return implVisitBinaryAtomic(I, ISD::ATOMIC_LOAD_MAX_32);
				4278	case MVT::i64:
				4279	return implVisitBinaryAtomic(I, ISD::ATOMIC_LOAD_MAX_64);
				4280	default:
				4281	assert(0 && "Invalid atomic type");
				4282	abort();
				4283	}
				4284	case Intrinsic::atomic_load_min:
				4285	switch (getValue(I.getOperand(2)).getValueType().getSimpleVT()) {
				4286	case MVT::i8:
				4287	return implVisitBinaryAtomic(I, ISD::ATOMIC_LOAD_MIN_8);
				4288	case MVT::i16:
				4289	return implVisitBinaryAtomic(I, ISD::ATOMIC_LOAD_MIN_16);
				4290	case MVT::i32:
				4291	return implVisitBinaryAtomic(I, ISD::ATOMIC_LOAD_MIN_32);
				4292	case MVT::i64:
				4293	return implVisitBinaryAtomic(I, ISD::ATOMIC_LOAD_MIN_64);
				4294	default:
				4295	assert(0 && "Invalid atomic type");
				4296	abort();
				4297	}
				4298	case Intrinsic::atomic_load_umin:
				4299	switch (getValue(I.getOperand(2)).getValueType().getSimpleVT()) {
				4300	case MVT::i8:
				4301	return implVisitBinaryAtomic(I, ISD::ATOMIC_LOAD_UMIN_8);
				4302	case MVT::i16:
				4303	return implVisitBinaryAtomic(I, ISD::ATOMIC_LOAD_UMIN_16);
				4304	case MVT::i32:
				4305	return implVisitBinaryAtomic(I, ISD::ATOMIC_LOAD_UMIN_32);
				4306	case MVT::i64:
				4307	return implVisitBinaryAtomic(I, ISD::ATOMIC_LOAD_UMIN_64);
				4308	default:
				4309	assert(0 && "Invalid atomic type");
				4310	abort();
				4311	}
				4312	case Intrinsic::atomic_load_umax:
				4313	switch (getValue(I.getOperand(2)).getValueType().getSimpleVT()) {
				4314	case MVT::i8:
				4315	return implVisitBinaryAtomic(I, ISD::ATOMIC_LOAD_UMAX_8);
				4316	case MVT::i16:
				4317	return implVisitBinaryAtomic(I, ISD::ATOMIC_LOAD_UMAX_16);
				4318	case MVT::i32:
				4319	return implVisitBinaryAtomic(I, ISD::ATOMIC_LOAD_UMAX_32);
				4320	case MVT::i64:
				4321	return implVisitBinaryAtomic(I, ISD::ATOMIC_LOAD_UMAX_64);
				4322	default:
				4323	assert(0 && "Invalid atomic type");
				4324	abort();
				4325	}
				4326	case Intrinsic::atomic_swap:
				4327	switch (getValue(I.getOperand(2)).getValueType().getSimpleVT()) {
				4328	case MVT::i8:
				4329	return implVisitBinaryAtomic(I, ISD::ATOMIC_SWAP_8);
				4330	case MVT::i16:
				4331	return implVisitBinaryAtomic(I, ISD::ATOMIC_SWAP_16);
				4332	case MVT::i32:
				4333	return implVisitBinaryAtomic(I, ISD::ATOMIC_SWAP_32);
				4334	case MVT::i64:
				4335	return implVisitBinaryAtomic(I, ISD::ATOMIC_SWAP_64);
				4336	default:
				4337	assert(0 && "Invalid atomic type");
				4338	abort();
				4339	}
				4340	}
				4341	}
				4342
				4343
				4344	void SelectionDAGLowering::LowerCallTo(CallSite CS, SDValue Callee,
				4345	bool IsTailCall,
				4346	MachineBasicBlock *LandingPad) {
				4347	const PointerType *PT = cast<PointerType>(CS.getCalledValue()->getType());
				4348	const FunctionType *FTy = cast<FunctionType>(PT->getElementType());
				4349	MachineModuleInfo *MMI = DAG.getMachineModuleInfo();
				4350	unsigned BeginLabel = 0, EndLabel = 0;
				4351
				4352	TargetLowering::ArgListTy Args;
				4353	TargetLowering::ArgListEntry Entry;
				4354	Args.reserve(CS.arg_size());
				4355	for (CallSite::arg_iterator i = CS.arg_begin(), e = CS.arg_end();
				4356	i != e; ++i) {
				4357	SDValue ArgNode = getValue(*i);
				4358	Entry.Node = ArgNode; Entry.Ty = (*i)->getType();
				4359
				4360	unsigned attrInd = i - CS.arg_begin() + 1;
Devang Patel	0598866	2008-09-25 21:00:45 +0000	[diff] [blame]	4361	Entry.isSExt = CS.paramHasAttr(attrInd, Attribute::SExt);
				4362	Entry.isZExt = CS.paramHasAttr(attrInd, Attribute::ZExt);
				4363	Entry.isInReg = CS.paramHasAttr(attrInd, Attribute::InReg);
				4364	Entry.isSRet = CS.paramHasAttr(attrInd, Attribute::StructRet);
				4365	Entry.isNest = CS.paramHasAttr(attrInd, Attribute::Nest);
				4366	Entry.isByVal = CS.paramHasAttr(attrInd, Attribute::ByVal);
Dan Gohman	f0cbcd4	2008-09-03 16:12:24 +0000	[diff] [blame]	4367	Entry.Alignment = CS.getParamAlignment(attrInd);
				4368	Args.push_back(Entry);
				4369	}
				4370
				4371	if (LandingPad && MMI) {
				4372	// Insert a label before the invoke call to mark the try range. This can be
				4373	// used to detect deletion of the invoke via the MachineModuleInfo.
				4374	BeginLabel = MMI->NextLabelID();
				4375	// Both PendingLoads and PendingExports must be flushed here;
				4376	// this call might not return.
				4377	(void)getRoot();
				4378	DAG.setRoot(DAG.getLabel(ISD::EH_LABEL, getControlRoot(), BeginLabel));
				4379	}
				4380
				4381	std::pair<SDValue,SDValue> Result =
				4382	TLI.LowerCallTo(getRoot(), CS.getType(),
Devang Patel	0598866	2008-09-25 21:00:45 +0000	[diff] [blame]	4383	CS.paramHasAttr(0, Attribute::SExt),
Dale Johannesen	86098bd	2008-09-26 19:31:26 +0000	[diff] [blame]	4384	CS.paramHasAttr(0, Attribute::ZExt), FTy->isVarArg(),
				4385	CS.paramHasAttr(0, Attribute::InReg),
				4386	CS.getCallingConv(),
Dan Gohman	1937e2f	2008-09-16 01:42:28 +0000	[diff] [blame]	4387	IsTailCall && PerformTailCallOpt,
Dan Gohman	f0cbcd4	2008-09-03 16:12:24 +0000	[diff] [blame]	4388	Callee, Args, DAG);
				4389	if (CS.getType() != Type::VoidTy)
				4390	setValue(CS.getInstruction(), Result.first);
				4391	DAG.setRoot(Result.second);
				4392
				4393	if (LandingPad && MMI) {
				4394	// Insert a label at the end of the invoke call to mark the try range. This
				4395	// can be used to detect deletion of the invoke via the MachineModuleInfo.
				4396	EndLabel = MMI->NextLabelID();
				4397	DAG.setRoot(DAG.getLabel(ISD::EH_LABEL, getRoot(), EndLabel));
				4398
				4399	// Inform MachineModuleInfo of range.
				4400	MMI->addInvoke(LandingPad, BeginLabel, EndLabel);
				4401	}
				4402	}
				4403
				4404
				4405	void SelectionDAGLowering::visitCall(CallInst &I) {
				4406	const char *RenameFn = 0;
				4407	if (Function *F = I.getCalledFunction()) {
				4408	if (F->isDeclaration()) {
				4409	if (unsigned IID = F->getIntrinsicID()) {
				4410	RenameFn = visitIntrinsicCall(I, IID);
				4411	if (!RenameFn)
				4412	return;
				4413	}
				4414	}
				4415
				4416	// Check for well-known libc/libm calls. If the function is internal, it
				4417	// can't be a library call.
				4418	unsigned NameLen = F->getNameLen();
				4419	if (!F->hasInternalLinkage() && NameLen) {
				4420	const char *NameStr = F->getNameStart();
				4421	if (NameStr[0] == 'c' &&
				4422	((NameLen == 8 && !strcmp(NameStr, "copysign")) \|\|
				4423	(NameLen == 9 && !strcmp(NameStr, "copysignf")))) {
				4424	if (I.getNumOperands() == 3 && // Basic sanity checks.
				4425	I.getOperand(1)->getType()->isFloatingPoint() &&
				4426	I.getType() == I.getOperand(1)->getType() &&
				4427	I.getType() == I.getOperand(2)->getType()) {
				4428	SDValue LHS = getValue(I.getOperand(1));
				4429	SDValue RHS = getValue(I.getOperand(2));
				4430	setValue(&I, DAG.getNode(ISD::FCOPYSIGN, LHS.getValueType(),
				4431	LHS, RHS));
				4432	return;
				4433	}
				4434	} else if (NameStr[0] == 'f' &&
				4435	((NameLen == 4 && !strcmp(NameStr, "fabs")) \|\|
				4436	(NameLen == 5 && !strcmp(NameStr, "fabsf")) \|\|
				4437	(NameLen == 5 && !strcmp(NameStr, "fabsl")))) {
				4438	if (I.getNumOperands() == 2 && // Basic sanity checks.
				4439	I.getOperand(1)->getType()->isFloatingPoint() &&
				4440	I.getType() == I.getOperand(1)->getType()) {
				4441	SDValue Tmp = getValue(I.getOperand(1));
				4442	setValue(&I, DAG.getNode(ISD::FABS, Tmp.getValueType(), Tmp));
				4443	return;
				4444	}
				4445	} else if (NameStr[0] == 's' &&
				4446	((NameLen == 3 && !strcmp(NameStr, "sin")) \|\|
				4447	(NameLen == 4 && !strcmp(NameStr, "sinf")) \|\|
				4448	(NameLen == 4 && !strcmp(NameStr, "sinl")))) {
				4449	if (I.getNumOperands() == 2 && // Basic sanity checks.
				4450	I.getOperand(1)->getType()->isFloatingPoint() &&
				4451	I.getType() == I.getOperand(1)->getType()) {
				4452	SDValue Tmp = getValue(I.getOperand(1));
				4453	setValue(&I, DAG.getNode(ISD::FSIN, Tmp.getValueType(), Tmp));
				4454	return;
				4455	}
				4456	} else if (NameStr[0] == 'c' &&
				4457	((NameLen == 3 && !strcmp(NameStr, "cos")) \|\|
				4458	(NameLen == 4 && !strcmp(NameStr, "cosf")) \|\|
				4459	(NameLen == 4 && !strcmp(NameStr, "cosl")))) {
				4460	if (I.getNumOperands() == 2 && // Basic sanity checks.
				4461	I.getOperand(1)->getType()->isFloatingPoint() &&
				4462	I.getType() == I.getOperand(1)->getType()) {
				4463	SDValue Tmp = getValue(I.getOperand(1));
				4464	setValue(&I, DAG.getNode(ISD::FCOS, Tmp.getValueType(), Tmp));
				4465	return;
				4466	}
				4467	}
				4468	}
				4469	} else if (isa<InlineAsm>(I.getOperand(0))) {
				4470	visitInlineAsm(&I);
				4471	return;
				4472	}
				4473
				4474	SDValue Callee;
				4475	if (!RenameFn)
				4476	Callee = getValue(I.getOperand(0));
				4477	else
Bill Wendling	056292f	2008-09-16 21:48:12 +0000	[diff] [blame]	4478	Callee = DAG.getExternalSymbol(RenameFn, TLI.getPointerTy());
Dan Gohman	f0cbcd4	2008-09-03 16:12:24 +0000	[diff] [blame]	4479
				4480	LowerCallTo(&I, Callee, I.isTailCall());
				4481	}
				4482
				4483
				4484	/// getCopyFromRegs - Emit a series of CopyFromReg nodes that copies from
				4485	/// this value and returns the result as a ValueVT value. This uses
				4486	/// Chain/Flag as the input and updates them for the output Chain/Flag.
				4487	/// If the Flag pointer is NULL, no flag is used.
				4488	SDValue RegsForValue::getCopyFromRegs(SelectionDAG &DAG,
				4489	SDValue &Chain,
				4490	SDValue *Flag) const {
				4491	// Assemble the legal parts into the final values.
				4492	SmallVector<SDValue, 4> Values(ValueVTs.size());
				4493	SmallVector<SDValue, 8> Parts;
				4494	for (unsigned Value = 0, Part = 0, e = ValueVTs.size(); Value != e; ++Value) {
				4495	// Copy the legal parts from the registers.
				4496	MVT ValueVT = ValueVTs[Value];
				4497	unsigned NumRegs = TLI->getNumRegisters(ValueVT);
				4498	MVT RegisterVT = RegVTs[Value];
				4499
				4500	Parts.resize(NumRegs);
				4501	for (unsigned i = 0; i != NumRegs; ++i) {
				4502	SDValue P;
				4503	if (Flag == 0)
				4504	P = DAG.getCopyFromReg(Chain, Regs[Part+i], RegisterVT);
				4505	else {
				4506	P = DAG.getCopyFromReg(Chain, Regs[Part+i], RegisterVT, *Flag);
				4507	*Flag = P.getValue(2);
				4508	}
				4509	Chain = P.getValue(1);
				4510
				4511	// If the source register was virtual and if we know something about it,
				4512	// add an assert node.
				4513	if (TargetRegisterInfo::isVirtualRegister(Regs[Part+i]) &&
				4514	RegisterVT.isInteger() && !RegisterVT.isVector()) {
				4515	unsigned SlotNo = Regs[Part+i]-TargetRegisterInfo::FirstVirtualRegister;
				4516	FunctionLoweringInfo &FLI = DAG.getFunctionLoweringInfo();
				4517	if (FLI.LiveOutRegInfo.size() > SlotNo) {
				4518	FunctionLoweringInfo::LiveOutInfo &LOI = FLI.LiveOutRegInfo[SlotNo];
				4519
				4520	unsigned RegSize = RegisterVT.getSizeInBits();
				4521	unsigned NumSignBits = LOI.NumSignBits;
				4522	unsigned NumZeroBits = LOI.KnownZero.countLeadingOnes();
				4523
				4524	// FIXME: We capture more information than the dag can represent. For
				4525	// now, just use the tightest assertzext/assertsext possible.
				4526	bool isSExt = true;
				4527	MVT FromVT(MVT::Other);
				4528	if (NumSignBits == RegSize)
				4529	isSExt = true, FromVT = MVT::i1; // ASSERT SEXT 1
				4530	else if (NumZeroBits >= RegSize-1)
				4531	isSExt = false, FromVT = MVT::i1; // ASSERT ZEXT 1
				4532	else if (NumSignBits > RegSize-8)
				4533	isSExt = true, FromVT = MVT::i8; // ASSERT SEXT 8
				4534	else if (NumZeroBits >= RegSize-9)
				4535	isSExt = false, FromVT = MVT::i8; // ASSERT ZEXT 8
				4536	else if (NumSignBits > RegSize-16)
Bill Wendling	181b627	2008-10-19 20:34:04 +0000	[diff] [blame]	4537	isSExt = true, FromVT = MVT::i16; // ASSERT SEXT 16
Dan Gohman	f0cbcd4	2008-09-03 16:12:24 +0000	[diff] [blame]	4538	else if (NumZeroBits >= RegSize-17)
Bill Wendling	181b627	2008-10-19 20:34:04 +0000	[diff] [blame]	4539	isSExt = false, FromVT = MVT::i16; // ASSERT ZEXT 16
Dan Gohman	f0cbcd4	2008-09-03 16:12:24 +0000	[diff] [blame]	4540	else if (NumSignBits > RegSize-32)
Bill Wendling	181b627	2008-10-19 20:34:04 +0000	[diff] [blame]	4541	isSExt = true, FromVT = MVT::i32; // ASSERT SEXT 32
Dan Gohman	f0cbcd4	2008-09-03 16:12:24 +0000	[diff] [blame]	4542	else if (NumZeroBits >= RegSize-33)
Bill Wendling	181b627	2008-10-19 20:34:04 +0000	[diff] [blame]	4543	isSExt = false, FromVT = MVT::i32; // ASSERT ZEXT 32
Dan Gohman	f0cbcd4	2008-09-03 16:12:24 +0000	[diff] [blame]	4544
				4545	if (FromVT != MVT::Other) {
				4546	P = DAG.getNode(isSExt ? ISD::AssertSext : ISD::AssertZext,
				4547	RegisterVT, P, DAG.getValueType(FromVT));
				4548
				4549	}
				4550	}
				4551	}
				4552
				4553	Parts[i] = P;
				4554	}
				4555
				4556	Values[Value] = getCopyFromParts(DAG, Parts.begin(), NumRegs, RegisterVT,
				4557	ValueVT);
				4558	Part += NumRegs;
				4559	Parts.clear();
				4560	}
				4561
Duncan Sands	aaffa05	2008-12-01 11:41:29 +0000	[diff] [blame]	4562	return DAG.getNode(ISD::MERGE_VALUES,
				4563	DAG.getVTList(&ValueVTs[0], ValueVTs.size()),
				4564	&Values[0], ValueVTs.size());
Dan Gohman	f0cbcd4	2008-09-03 16:12:24 +0000	[diff] [blame]	4565	}
				4566
				4567	/// getCopyToRegs - Emit a series of CopyToReg nodes that copies the
				4568	/// specified value into the registers specified by this object. This uses
				4569	/// Chain/Flag as the input and updates them for the output Chain/Flag.
				4570	/// If the Flag pointer is NULL, no flag is used.
				4571	void RegsForValue::getCopyToRegs(SDValue Val, SelectionDAG &DAG,
				4572	SDValue &Chain, SDValue *Flag) const {
				4573	// Get the list of the values's legal parts.
				4574	unsigned NumRegs = Regs.size();
				4575	SmallVector<SDValue, 8> Parts(NumRegs);
				4576	for (unsigned Value = 0, Part = 0, e = ValueVTs.size(); Value != e; ++Value) {
				4577	MVT ValueVT = ValueVTs[Value];
				4578	unsigned NumParts = TLI->getNumRegisters(ValueVT);
				4579	MVT RegisterVT = RegVTs[Value];
				4580
				4581	getCopyToParts(DAG, Val.getValue(Val.getResNo() + Value),
				4582	&Parts[Part], NumParts, RegisterVT);
				4583	Part += NumParts;
				4584	}
				4585
				4586	// Copy the parts into the registers.
				4587	SmallVector<SDValue, 8> Chains(NumRegs);
				4588	for (unsigned i = 0; i != NumRegs; ++i) {
				4589	SDValue Part;
				4590	if (Flag == 0)
				4591	Part = DAG.getCopyToReg(Chain, Regs[i], Parts[i]);
				4592	else {
				4593	Part = DAG.getCopyToReg(Chain, Regs[i], Parts[i], *Flag);
				4594	*Flag = Part.getValue(1);
				4595	}
				4596	Chains[i] = Part.getValue(0);
				4597	}
				4598
				4599	if (NumRegs == 1 \|\| Flag)
				4600	// If NumRegs > 1 && Flag is used then the use of the last CopyToReg is
				4601	// flagged to it. That is the CopyToReg nodes and the user are considered
				4602	// a single scheduling unit. If we create a TokenFactor and return it as
				4603	// chain, then the TokenFactor is both a predecessor (operand) of the
				4604	// user as well as a successor (the TF operands are flagged to the user).
				4605	// c1, f1 = CopyToReg
				4606	// c2, f2 = CopyToReg
				4607	// c3 = TokenFactor c1, c2
				4608	// ...
				4609	// = op c3, ..., f2
				4610	Chain = Chains[NumRegs-1];
				4611	else
				4612	Chain = DAG.getNode(ISD::TokenFactor, MVT::Other, &Chains[0], NumRegs);
				4613	}
				4614
				4615	/// AddInlineAsmOperands - Add this value to the specified inlineasm node
				4616	/// operand list. This adds the code marker and includes the number of
				4617	/// values added into it.
				4618	void RegsForValue::AddInlineAsmOperands(unsigned Code, SelectionDAG &DAG,
				4619	std::vector<SDValue> &Ops) const {
				4620	MVT IntPtrTy = DAG.getTargetLoweringInfo().getPointerTy();
				4621	Ops.push_back(DAG.getTargetConstant(Code \| (Regs.size() << 3), IntPtrTy));
				4622	for (unsigned Value = 0, Reg = 0, e = ValueVTs.size(); Value != e; ++Value) {
				4623	unsigned NumRegs = TLI->getNumRegisters(ValueVTs[Value]);
				4624	MVT RegisterVT = RegVTs[Value];
Chris Lattner	58f15c4	2008-10-17 16:21:11 +0000	[diff] [blame]	4625	for (unsigned i = 0; i != NumRegs; ++i) {
				4626	assert(Reg < Regs.size() && "Mismatch in # registers expected");
Dan Gohman	f0cbcd4	2008-09-03 16:12:24 +0000	[diff] [blame]	4627	Ops.push_back(DAG.getRegister(Regs[Reg++], RegisterVT));
Chris Lattner	58f15c4	2008-10-17 16:21:11 +0000	[diff] [blame]	4628	}
Dan Gohman	f0cbcd4	2008-09-03 16:12:24 +0000	[diff] [blame]	4629	}
				4630	}
				4631
				4632	/// isAllocatableRegister - If the specified register is safe to allocate,
				4633	/// i.e. it isn't a stack pointer or some other special register, return the
				4634	/// register class for the register. Otherwise, return null.
				4635	static const TargetRegisterClass *
				4636	isAllocatableRegister(unsigned Reg, MachineFunction &MF,
				4637	const TargetLowering &TLI,
				4638	const TargetRegisterInfo *TRI) {
				4639	MVT FoundVT = MVT::Other;
				4640	const TargetRegisterClass *FoundRC = 0;
				4641	for (TargetRegisterInfo::regclass_iterator RCI = TRI->regclass_begin(),
				4642	E = TRI->regclass_end(); RCI != E; ++RCI) {
				4643	MVT ThisVT = MVT::Other;
				4644
				4645	const TargetRegisterClass RC = RCI;
				4646	// If none of the the value types for this register class are valid, we
				4647	// can't use it. For example, 64-bit reg classes on 32-bit targets.
				4648	for (TargetRegisterClass::vt_iterator I = RC->vt_begin(), E = RC->vt_end();
				4649	I != E; ++I) {
				4650	if (TLI.isTypeLegal(*I)) {
				4651	// If we have already found this register in a different register class,
				4652	// choose the one with the largest VT specified. For example, on
				4653	// PowerPC, we favor f64 register classes over f32.
				4654	if (FoundVT == MVT::Other \|\| FoundVT.bitsLT(*I)) {
				4655	ThisVT = *I;
				4656	break;
				4657	}
				4658	}
				4659	}
				4660
				4661	if (ThisVT == MVT::Other) continue;
				4662
				4663	// NOTE: This isn't ideal. In particular, this might allocate the
				4664	// frame pointer in functions that need it (due to them not being taken
				4665	// out of allocation, because a variable sized allocation hasn't been seen
				4666	// yet). This is a slight code pessimization, but should still work.
				4667	for (TargetRegisterClass::iterator I = RC->allocation_order_begin(MF),
				4668	E = RC->allocation_order_end(MF); I != E; ++I)
				4669	if (*I == Reg) {
				4670	// We found a matching register class. Keep looking at others in case
				4671	// we find one with larger registers that this physreg is also in.
				4672	FoundRC = RC;
				4673	FoundVT = ThisVT;
				4674	break;
				4675	}
				4676	}
				4677	return FoundRC;
				4678	}
				4679
				4680
				4681	namespace llvm {
				4682	/// AsmOperandInfo - This contains information for each constraint that we are
				4683	/// lowering.
Daniel Dunbar	c0c3b9a	2008-09-10 04:16:29 +0000	[diff] [blame]	4684	struct VISIBILITY_HIDDEN SDISelAsmOperandInfo :
				4685	public TargetLowering::AsmOperandInfo {
Dan Gohman	f0cbcd4	2008-09-03 16:12:24 +0000	[diff] [blame]	4686	/// CallOperand - If this is the result output operand or a clobber
				4687	/// this is null, otherwise it is the incoming operand to the CallInst.
				4688	/// This gets modified as the asm is processed.
				4689	SDValue CallOperand;
				4690
				4691	/// AssignedRegs - If this is a register or register class operand, this
				4692	/// contains the set of register corresponding to the operand.
				4693	RegsForValue AssignedRegs;
				4694
				4695	explicit SDISelAsmOperandInfo(const InlineAsm::ConstraintInfo &info)
				4696	: TargetLowering::AsmOperandInfo(info), CallOperand(0,0) {
				4697	}
				4698
				4699	/// MarkAllocatedRegs - Once AssignedRegs is set, mark the assigned registers
				4700	/// busy in OutputRegs/InputRegs.
				4701	void MarkAllocatedRegs(bool isOutReg, bool isInReg,
				4702	std::set<unsigned> &OutputRegs,
				4703	std::set<unsigned> &InputRegs,
				4704	const TargetRegisterInfo &TRI) const {
				4705	if (isOutReg) {
				4706	for (unsigned i = 0, e = AssignedRegs.Regs.size(); i != e; ++i)
				4707	MarkRegAndAliases(AssignedRegs.Regs[i], OutputRegs, TRI);
				4708	}
				4709	if (isInReg) {
				4710	for (unsigned i = 0, e = AssignedRegs.Regs.size(); i != e; ++i)
				4711	MarkRegAndAliases(AssignedRegs.Regs[i], InputRegs, TRI);
				4712	}
				4713	}
Chris Lattner	81249c9	2008-10-17 17:05:25 +0000	[diff] [blame]	4714
				4715	/// getCallOperandValMVT - Return the MVT of the Value* that this operand
				4716	/// corresponds to. If there is no Value* for this operand, it returns
				4717	/// MVT::Other.
				4718	MVT getCallOperandValMVT(const TargetLowering &TLI,
				4719	const TargetData *TD) const {
				4720	if (CallOperandVal == 0) return MVT::Other;
				4721
				4722	if (isa<BasicBlock>(CallOperandVal))
				4723	return TLI.getPointerTy();
				4724
				4725	const llvm::Type *OpTy = CallOperandVal->getType();
				4726
				4727	// If this is an indirect operand, the operand is a pointer to the
				4728	// accessed type.
				4729	if (isIndirect)
				4730	OpTy = cast<PointerType>(OpTy)->getElementType();
				4731
				4732	// If OpTy is not a single value, it may be a struct/union that we
				4733	// can tile with integers.
				4734	if (!OpTy->isSingleValueType() && OpTy->isSized()) {
				4735	unsigned BitSize = TD->getTypeSizeInBits(OpTy);
				4736	switch (BitSize) {
				4737	default: break;
				4738	case 1:
				4739	case 8:
				4740	case 16:
				4741	case 32:
				4742	case 64:
Chris Lattner	cfc14c1	2008-10-17 19:59:51 +0000	[diff] [blame]	4743	case 128:
Chris Lattner	81249c9	2008-10-17 17:05:25 +0000	[diff] [blame]	4744	OpTy = IntegerType::get(BitSize);
				4745	break;
				4746	}
				4747	}
				4748
				4749	return TLI.getValueType(OpTy, true);
				4750	}
Dan Gohman	f0cbcd4	2008-09-03 16:12:24 +0000	[diff] [blame]	4751
				4752	private:
				4753	/// MarkRegAndAliases - Mark the specified register and all aliases in the
				4754	/// specified set.
				4755	static void MarkRegAndAliases(unsigned Reg, std::set<unsigned> &Regs,
				4756	const TargetRegisterInfo &TRI) {
				4757	assert(TargetRegisterInfo::isPhysicalRegister(Reg) && "Isn't a physreg");
				4758	Regs.insert(Reg);
				4759	if (const unsigned *Aliases = TRI.getAliasSet(Reg))
				4760	for (; *Aliases; ++Aliases)
				4761	Regs.insert(*Aliases);
				4762	}
				4763	};
				4764	} // end llvm namespace.
				4765
				4766
				4767	/// GetRegistersForValue - Assign registers (virtual or physical) for the
				4768	/// specified operand. We prefer to assign virtual registers, to allow the
				4769	/// register allocator handle the assignment process. However, if the asm uses
				4770	/// features that we can't model on machineinstrs, we have SDISel do the
				4771	/// allocation. This produces generally horrible, but correct, code.
				4772	///
				4773	/// OpInfo describes the operand.
Dan Gohman	f0cbcd4	2008-09-03 16:12:24 +0000	[diff] [blame]	4774	/// Input and OutputRegs are the set of already allocated physical registers.
				4775	///
				4776	void SelectionDAGLowering::
Dale Johannesen	8e3455b	2008-09-24 23:13:09 +0000	[diff] [blame]	4777	GetRegistersForValue(SDISelAsmOperandInfo &OpInfo,
Dan Gohman	f0cbcd4	2008-09-03 16:12:24 +0000	[diff] [blame]	4778	std::set<unsigned> &OutputRegs,
				4779	std::set<unsigned> &InputRegs) {
				4780	// Compute whether this value requires an input register, an output register,
				4781	// or both.
				4782	bool isOutReg = false;
				4783	bool isInReg = false;
				4784	switch (OpInfo.Type) {
				4785	case InlineAsm::isOutput:
				4786	isOutReg = true;
				4787
Dale Johannesen	8e3455b	2008-09-24 23:13:09 +0000	[diff] [blame]	4788	// If there is an input constraint that matches this, we need to reserve
				4789	// the input register so no other inputs allocate to it.
Chris Lattner	6bdcda3	2008-10-17 16:47:46 +0000	[diff] [blame]	4790	isInReg = OpInfo.hasMatchingInput();
Dan Gohman	f0cbcd4	2008-09-03 16:12:24 +0000	[diff] [blame]	4791	break;
				4792	case InlineAsm::isInput:
				4793	isInReg = true;
				4794	isOutReg = false;
				4795	break;
				4796	case InlineAsm::isClobber:
				4797	isOutReg = true;
				4798	isInReg = true;
				4799	break;
				4800	}
				4801
				4802
				4803	MachineFunction &MF = DAG.getMachineFunction();
				4804	SmallVector<unsigned, 4> Regs;
				4805
				4806	// If this is a constraint for a single physreg, or a constraint for a
				4807	// register class, find it.
				4808	std::pair<unsigned, const TargetRegisterClass*> PhysReg =
				4809	TLI.getRegForInlineAsmConstraint(OpInfo.ConstraintCode,
				4810	OpInfo.ConstraintVT);
				4811
				4812	unsigned NumRegs = 1;
Chris Lattner	01426e1	2008-10-21 00:45:36 +0000	[diff] [blame]	4813	if (OpInfo.ConstraintVT != MVT::Other) {
				4814	// If this is a FP input in an integer register (or visa versa) insert a bit
				4815	// cast of the input value. More generally, handle any case where the input
				4816	// value disagrees with the register class we plan to stick this in.
				4817	if (OpInfo.Type == InlineAsm::isInput &&
				4818	PhysReg.second && !PhysReg.second->hasType(OpInfo.ConstraintVT)) {
				4819	// Try to convert to the first MVT that the reg class contains. If the
				4820	// types are identical size, use a bitcast to convert (e.g. two differing
				4821	// vector types).
				4822	MVT RegVT = *PhysReg.second->vt_begin();
				4823	if (RegVT.getSizeInBits() == OpInfo.ConstraintVT.getSizeInBits()) {
				4824	OpInfo.CallOperand = DAG.getNode(ISD::BIT_CONVERT, RegVT,
				4825	OpInfo.CallOperand);
				4826	OpInfo.ConstraintVT = RegVT;
				4827	} else if (RegVT.isInteger() && OpInfo.ConstraintVT.isFloatingPoint()) {
				4828	// If the input is a FP value and we want it in FP registers, do a
				4829	// bitcast to the corresponding integer type. This turns an f64 value
				4830	// into i64, which can be passed with two i32 values on a 32-bit
				4831	// machine.
				4832	RegVT = MVT::getIntegerVT(OpInfo.ConstraintVT.getSizeInBits());
				4833	OpInfo.CallOperand = DAG.getNode(ISD::BIT_CONVERT, RegVT,
				4834	OpInfo.CallOperand);
				4835	OpInfo.ConstraintVT = RegVT;
				4836	}
				4837	}
				4838
Dan Gohman	f0cbcd4	2008-09-03 16:12:24 +0000	[diff] [blame]	4839	NumRegs = TLI.getNumRegisters(OpInfo.ConstraintVT);
Chris Lattner	01426e1	2008-10-21 00:45:36 +0000	[diff] [blame]	4840	}
				4841
Dan Gohman	f0cbcd4	2008-09-03 16:12:24 +0000	[diff] [blame]	4842	MVT RegVT;
				4843	MVT ValueVT = OpInfo.ConstraintVT;
Dan Gohman	f0cbcd4	2008-09-03 16:12:24 +0000	[diff] [blame]	4844
				4845	// If this is a constraint for a specific physical register, like {r17},
				4846	// assign it now.
				4847	if (PhysReg.first) {
				4848	if (OpInfo.ConstraintVT == MVT::Other)
				4849	ValueVT = *PhysReg.second->vt_begin();
				4850
				4851	// Get the actual register value type. This is important, because the user
				4852	// may have asked for (e.g.) the AX register in i32 type. We need to
				4853	// remember that AX is actually i16 to get the right extension.
				4854	RegVT = *PhysReg.second->vt_begin();
				4855
				4856	// This is a explicit reference to a physical register.
				4857	Regs.push_back(PhysReg.first);
				4858
				4859	// If this is an expanded reference, add the rest of the regs to Regs.
				4860	if (NumRegs != 1) {
				4861	TargetRegisterClass::iterator I = PhysReg.second->begin();
				4862	for (; *I != PhysReg.first; ++I)
				4863	assert(I != PhysReg.second->end() && "Didn't find reg!");
				4864
				4865	// Already added the first reg.
				4866	--NumRegs; ++I;
				4867	for (; NumRegs; --NumRegs, ++I) {
				4868	assert(I != PhysReg.second->end() && "Ran out of registers to allocate!");
				4869	Regs.push_back(*I);
				4870	}
				4871	}
				4872	OpInfo.AssignedRegs = RegsForValue(TLI, Regs, RegVT, ValueVT);
				4873	const TargetRegisterInfo *TRI = DAG.getTarget().getRegisterInfo();
				4874	OpInfo.MarkAllocatedRegs(isOutReg, isInReg, OutputRegs, InputRegs, *TRI);
				4875	return;
				4876	}
				4877
				4878	// Otherwise, if this was a reference to an LLVM register class, create vregs
				4879	// for this reference.
				4880	std::vector<unsigned> RegClassRegs;
				4881	const TargetRegisterClass *RC = PhysReg.second;
				4882	if (RC) {
Dale Johannesen	8e3455b	2008-09-24 23:13:09 +0000	[diff] [blame]	4883	// If this is a tied register, our regalloc doesn't know how to maintain
Chris Lattner	58f15c4	2008-10-17 16:21:11 +0000	[diff] [blame]	4884	// the constraint, so we have to pick a register to pin the input/output to.
				4885	// If it isn't a matched constraint, go ahead and create vreg and let the
				4886	// regalloc do its thing.
Chris Lattner	6bdcda3	2008-10-17 16:47:46 +0000	[diff] [blame]	4887	if (!OpInfo.hasMatchingInput()) {
Dan Gohman	f0cbcd4	2008-09-03 16:12:24 +0000	[diff] [blame]	4888	RegVT = *PhysReg.second->vt_begin();
Dan Gohman	f0cbcd4	2008-09-03 16:12:24 +0000	[diff] [blame]	4889	if (OpInfo.ConstraintVT == MVT::Other)
				4890	ValueVT = RegVT;
				4891
				4892	// Create the appropriate number of virtual registers.
				4893	MachineRegisterInfo &RegInfo = MF.getRegInfo();
				4894	for (; NumRegs; --NumRegs)
				4895	Regs.push_back(RegInfo.createVirtualRegister(PhysReg.second));
				4896
				4897	OpInfo.AssignedRegs = RegsForValue(TLI, Regs, RegVT, ValueVT);
				4898	return;
				4899	}
				4900
				4901	// Otherwise, we can't allocate it. Let the code below figure out how to
				4902	// maintain these constraints.
				4903	RegClassRegs.assign(PhysReg.second->begin(), PhysReg.second->end());
				4904
				4905	} else {
				4906	// This is a reference to a register class that doesn't directly correspond
				4907	// to an LLVM register class. Allocate NumRegs consecutive, available,
				4908	// registers from the class.
				4909	RegClassRegs = TLI.getRegClassForInlineAsmConstraint(OpInfo.ConstraintCode,
				4910	OpInfo.ConstraintVT);
				4911	}
				4912
				4913	const TargetRegisterInfo *TRI = DAG.getTarget().getRegisterInfo();
				4914	unsigned NumAllocated = 0;
				4915	for (unsigned i = 0, e = RegClassRegs.size(); i != e; ++i) {
				4916	unsigned Reg = RegClassRegs[i];
				4917	// See if this register is available.
				4918	if ((isOutReg && OutputRegs.count(Reg)) \|\| // Already used.
				4919	(isInReg && InputRegs.count(Reg))) { // Already used.
				4920	// Make sure we find consecutive registers.
				4921	NumAllocated = 0;
				4922	continue;
				4923	}
				4924
				4925	// Check to see if this register is allocatable (i.e. don't give out the
				4926	// stack pointer).
				4927	if (RC == 0) {
				4928	RC = isAllocatableRegister(Reg, MF, TLI, TRI);
				4929	if (!RC) { // Couldn't allocate this register.
				4930	// Reset NumAllocated to make sure we return consecutive registers.
				4931	NumAllocated = 0;
				4932	continue;
				4933	}
				4934	}
				4935
				4936	// Okay, this register is good, we can use it.
				4937	++NumAllocated;
				4938
				4939	// If we allocated enough consecutive registers, succeed.
				4940	if (NumAllocated == NumRegs) {
				4941	unsigned RegStart = (i-NumAllocated)+1;
				4942	unsigned RegEnd = i+1;
				4943	// Mark all of the allocated registers used.
				4944	for (unsigned i = RegStart; i != RegEnd; ++i)
				4945	Regs.push_back(RegClassRegs[i]);
				4946
				4947	OpInfo.AssignedRegs = RegsForValue(TLI, Regs, *RC->vt_begin(),
				4948	OpInfo.ConstraintVT);
				4949	OpInfo.MarkAllocatedRegs(isOutReg, isInReg, OutputRegs, InputRegs, *TRI);
				4950	return;
				4951	}
				4952	}
				4953
				4954	// Otherwise, we couldn't allocate enough registers for this.
				4955	}
				4956
Evan Cheng	da43bcf	2008-09-24 00:05:32 +0000	[diff] [blame]	4957	/// hasInlineAsmMemConstraint - Return true if the inline asm instruction being
				4958	/// processed uses a memory 'm' constraint.
				4959	static bool
				4960	hasInlineAsmMemConstraint(std::vector<InlineAsm::ConstraintInfo> &CInfos,
				4961	TargetLowering &TLI) {
				4962	for (unsigned i = 0, e = CInfos.size(); i != e; ++i) {
				4963	InlineAsm::ConstraintInfo &CI = CInfos[i];
				4964	for (unsigned j = 0, ee = CI.Codes.size(); j != ee; ++j) {
				4965	TargetLowering::ConstraintType CType = TLI.getConstraintType(CI.Codes[j]);
				4966	if (CType == TargetLowering::C_Memory)
				4967	return true;
				4968	}
				4969	}
				4970
				4971	return false;
				4972	}
Dan Gohman	f0cbcd4	2008-09-03 16:12:24 +0000	[diff] [blame]	4973
				4974	/// visitInlineAsm - Handle a call to an InlineAsm object.
				4975	///
				4976	void SelectionDAGLowering::visitInlineAsm(CallSite CS) {
				4977	InlineAsm *IA = cast<InlineAsm>(CS.getCalledValue());
				4978
				4979	/// ConstraintOperands - Information about all of the constraints.
				4980	std::vector<SDISelAsmOperandInfo> ConstraintOperands;
				4981
				4982	SDValue Chain = getRoot();
				4983	SDValue Flag;
				4984
				4985	std::set<unsigned> OutputRegs, InputRegs;
				4986
				4987	// Do a prepass over the constraints, canonicalizing them, and building up the
				4988	// ConstraintOperands list.
				4989	std::vector<InlineAsm::ConstraintInfo>
				4990	ConstraintInfos = IA->ParseConstraints();
				4991
Evan Cheng	da43bcf	2008-09-24 00:05:32 +0000	[diff] [blame]	4992	bool hasMemory = hasInlineAsmMemConstraint(ConstraintInfos, TLI);
Dan Gohman	f0cbcd4	2008-09-03 16:12:24 +0000	[diff] [blame]	4993
				4994	unsigned ArgNo = 0; // ArgNo - The argument of the CallInst.
				4995	unsigned ResNo = 0; // ResNo - The result number of the next output.
				4996	for (unsigned i = 0, e = ConstraintInfos.size(); i != e; ++i) {
				4997	ConstraintOperands.push_back(SDISelAsmOperandInfo(ConstraintInfos[i]));
				4998	SDISelAsmOperandInfo &OpInfo = ConstraintOperands.back();
				4999
				5000	MVT OpVT = MVT::Other;
				5001
				5002	// Compute the value type for each operand.
				5003	switch (OpInfo.Type) {
				5004	case InlineAsm::isOutput:
				5005	// Indirect outputs just consume an argument.
				5006	if (OpInfo.isIndirect) {
				5007	OpInfo.CallOperandVal = CS.getArgument(ArgNo++);
				5008	break;
				5009	}
Chris Lattner	2a0b96c	2008-10-18 18:49:30 +0000	[diff] [blame]	5010
Dan Gohman	f0cbcd4	2008-09-03 16:12:24 +0000	[diff] [blame]	5011	// The return value of the call is this value. As such, there is no
				5012	// corresponding argument.
				5013	assert(CS.getType() != Type::VoidTy && "Bad inline asm!");
				5014	if (const StructType *STy = dyn_cast<StructType>(CS.getType())) {
				5015	OpVT = TLI.getValueType(STy->getElementType(ResNo));
				5016	} else {
				5017	assert(ResNo == 0 && "Asm only has one result!");
				5018	OpVT = TLI.getValueType(CS.getType());
				5019	}
				5020	++ResNo;
				5021	break;
				5022	case InlineAsm::isInput:
				5023	OpInfo.CallOperandVal = CS.getArgument(ArgNo++);
				5024	break;
				5025	case InlineAsm::isClobber:
				5026	// Nothing to do.
				5027	break;
				5028	}
				5029
				5030	// If this is an input or an indirect output, process the call argument.
				5031	// BasicBlocks are labels, currently appearing only in asm's.
				5032	if (OpInfo.CallOperandVal) {
Chris Lattner	81249c9	2008-10-17 17:05:25 +0000	[diff] [blame]	5033	if (BasicBlock *BB = dyn_cast<BasicBlock>(OpInfo.CallOperandVal)) {
Dan Gohman	f0cbcd4	2008-09-03 16:12:24 +0000	[diff] [blame]	5034	OpInfo.CallOperand = DAG.getBasicBlock(FuncInfo.MBBMap[BB]);
Chris Lattner	81249c9	2008-10-17 17:05:25 +0000	[diff] [blame]	5035	} else {
Dan Gohman	f0cbcd4	2008-09-03 16:12:24 +0000	[diff] [blame]	5036	OpInfo.CallOperand = getValue(OpInfo.CallOperandVal);
Dan Gohman	f0cbcd4	2008-09-03 16:12:24 +0000	[diff] [blame]	5037	}
Chris Lattner	81249c9	2008-10-17 17:05:25 +0000	[diff] [blame]	5038
				5039	OpVT = OpInfo.getCallOperandValMVT(TLI, TD);
Dan Gohman	f0cbcd4	2008-09-03 16:12:24 +0000	[diff] [blame]	5040	}
				5041
				5042	OpInfo.ConstraintVT = OpVT;
Chris Lattner	2a0b96c	2008-10-18 18:49:30 +0000	[diff] [blame]	5043	}
				5044
				5045	// Second pass over the constraints: compute which constraint option to use
				5046	// and assign registers to constraints that want a specific physreg.
				5047	for (unsigned i = 0, e = ConstraintInfos.size(); i != e; ++i) {
				5048	SDISelAsmOperandInfo &OpInfo = ConstraintOperands[i];
				5049
				5050	// If this is an output operand with a matching input operand, look up the
Evan Cheng	09dc9c0	2008-12-16 18:21:39 +0000	[diff] [blame^]	5051	// matching input. If their types mismatch, e.g. one is an integer, the
				5052	// other is floating point, or their sizes are different, flag it as an
				5053	// error.
Chris Lattner	2a0b96c	2008-10-18 18:49:30 +0000	[diff] [blame]	5054	if (OpInfo.hasMatchingInput()) {
				5055	SDISelAsmOperandInfo &Input = ConstraintOperands[OpInfo.MatchingInput];
				5056	if (OpInfo.ConstraintVT != Input.ConstraintVT) {
Evan Cheng	09dc9c0	2008-12-16 18:21:39 +0000	[diff] [blame^]	5057	if ((OpInfo.ConstraintVT.isInteger() !=
				5058	Input.ConstraintVT.isInteger()) \|\|
				5059	(OpInfo.ConstraintVT.getSizeInBits() !=
				5060	Input.ConstraintVT.getSizeInBits())) {
				5061	cerr << "Unsupported asm: input constraint with a matching output "
				5062	<< "constraint of incompatible type!\n";
				5063	exit(1);
				5064	}
				5065	Input.ConstraintVT = OpInfo.ConstraintVT;
Chris Lattner	2a0b96c	2008-10-18 18:49:30 +0000	[diff] [blame]	5066	}
				5067	}
Dan Gohman	f0cbcd4	2008-09-03 16:12:24 +0000	[diff] [blame]	5068
				5069	// Compute the constraint code and ConstraintType to use.
Evan Cheng	da43bcf	2008-09-24 00:05:32 +0000	[diff] [blame]	5070	TLI.ComputeConstraintToUse(OpInfo, OpInfo.CallOperand, hasMemory, &DAG);
Dan Gohman	f0cbcd4	2008-09-03 16:12:24 +0000	[diff] [blame]	5071
Dan Gohman	f0cbcd4	2008-09-03 16:12:24 +0000	[diff] [blame]	5072	// If this is a memory input, and if the operand is not indirect, do what we
				5073	// need to to provide an address for the memory input.
				5074	if (OpInfo.ConstraintType == TargetLowering::C_Memory &&
				5075	!OpInfo.isIndirect) {
				5076	assert(OpInfo.Type == InlineAsm::isInput &&
				5077	"Can only indirectify direct input operands!");
				5078
				5079	// Memory operands really want the address of the value. If we don't have
				5080	// an indirect input, put it in the constpool if we can, otherwise spill
				5081	// it to a stack slot.
				5082
				5083	// If the operand is a float, integer, or vector constant, spill to a
				5084	// constant pool entry to get its address.
				5085	Value *OpVal = OpInfo.CallOperandVal;
				5086	if (isa<ConstantFP>(OpVal) \|\| isa<ConstantInt>(OpVal) \|\|
				5087	isa<ConstantVector>(OpVal)) {
				5088	OpInfo.CallOperand = DAG.getConstantPool(cast<Constant>(OpVal),
				5089	TLI.getPointerTy());
				5090	} else {
				5091	// Otherwise, create a stack slot and emit a store to it before the
				5092	// asm.
				5093	const Type *Ty = OpVal->getType();
				5094	uint64_t TySize = TLI.getTargetData()->getABITypeSize(Ty);
				5095	unsigned Align = TLI.getTargetData()->getPrefTypeAlignment(Ty);
				5096	MachineFunction &MF = DAG.getMachineFunction();
				5097	int SSFI = MF.getFrameInfo()->CreateStackObject(TySize, Align);
				5098	SDValue StackSlot = DAG.getFrameIndex(SSFI, TLI.getPointerTy());
				5099	Chain = DAG.getStore(Chain, OpInfo.CallOperand, StackSlot, NULL, 0);
				5100	OpInfo.CallOperand = StackSlot;
				5101	}
				5102
				5103	// There is no longer a Value* corresponding to this operand.
				5104	OpInfo.CallOperandVal = 0;
				5105	// It is now an indirect operand.
				5106	OpInfo.isIndirect = true;
				5107	}
				5108
				5109	// If this constraint is for a specific register, allocate it before
				5110	// anything else.
				5111	if (OpInfo.ConstraintType == TargetLowering::C_Register)
Dale Johannesen	8e3455b	2008-09-24 23:13:09 +0000	[diff] [blame]	5112	GetRegistersForValue(OpInfo, OutputRegs, InputRegs);
Dan Gohman	f0cbcd4	2008-09-03 16:12:24 +0000	[diff] [blame]	5113	}
				5114	ConstraintInfos.clear();
				5115
				5116
				5117	// Second pass - Loop over all of the operands, assigning virtual or physregs
Chris Lattner	58f15c4	2008-10-17 16:21:11 +0000	[diff] [blame]	5118	// to register class operands.
Dan Gohman	f0cbcd4	2008-09-03 16:12:24 +0000	[diff] [blame]	5119	for (unsigned i = 0, e = ConstraintOperands.size(); i != e; ++i) {
				5120	SDISelAsmOperandInfo &OpInfo = ConstraintOperands[i];
				5121
				5122	// C_Register operands have already been allocated, Other/Memory don't need
				5123	// to be.
				5124	if (OpInfo.ConstraintType == TargetLowering::C_RegisterClass)
Dale Johannesen	8e3455b	2008-09-24 23:13:09 +0000	[diff] [blame]	5125	GetRegistersForValue(OpInfo, OutputRegs, InputRegs);
Dan Gohman	f0cbcd4	2008-09-03 16:12:24 +0000	[diff] [blame]	5126	}
				5127
				5128	// AsmNodeOperands - The operands for the ISD::INLINEASM node.
				5129	std::vector<SDValue> AsmNodeOperands;
				5130	AsmNodeOperands.push_back(SDValue()); // reserve space for input chain
				5131	AsmNodeOperands.push_back(
Bill Wendling	056292f	2008-09-16 21:48:12 +0000	[diff] [blame]	5132	DAG.getTargetExternalSymbol(IA->getAsmString().c_str(), MVT::Other));
Dan Gohman	f0cbcd4	2008-09-03 16:12:24 +0000	[diff] [blame]	5133
				5134
				5135	// Loop over all of the inputs, copying the operand values into the
				5136	// appropriate registers and processing the output regs.
				5137	RegsForValue RetValRegs;
				5138
				5139	// IndirectStoresToEmit - The set of stores to emit after the inline asm node.
				5140	std::vector<std::pair<RegsForValue, Value*> > IndirectStoresToEmit;
				5141
				5142	for (unsigned i = 0, e = ConstraintOperands.size(); i != e; ++i) {
				5143	SDISelAsmOperandInfo &OpInfo = ConstraintOperands[i];
				5144
				5145	switch (OpInfo.Type) {
				5146	case InlineAsm::isOutput: {
				5147	if (OpInfo.ConstraintType != TargetLowering::C_RegisterClass &&
				5148	OpInfo.ConstraintType != TargetLowering::C_Register) {
				5149	// Memory output, or 'other' output (e.g. 'X' constraint).
				5150	assert(OpInfo.isIndirect && "Memory output must be indirect operand");
				5151
				5152	// Add information to the INLINEASM node to know about this output.
Dale Johannesen	86b49f8	2008-09-24 01:07:17 +0000	[diff] [blame]	5153	unsigned ResOpType = 4/MEM/ \| (1<<3);
				5154	AsmNodeOperands.push_back(DAG.getTargetConstant(ResOpType,
Dan Gohman	f0cbcd4	2008-09-03 16:12:24 +0000	[diff] [blame]	5155	TLI.getPointerTy()));
				5156	AsmNodeOperands.push_back(OpInfo.CallOperand);
				5157	break;
				5158	}
				5159
				5160	// Otherwise, this is a register or register class output.
				5161
				5162	// Copy the output from the appropriate register. Find a register that
				5163	// we can use.
				5164	if (OpInfo.AssignedRegs.Regs.empty()) {
				5165	cerr << "Couldn't allocate output reg for constraint '"
				5166	<< OpInfo.ConstraintCode << "'!\n";
				5167	exit(1);
				5168	}
				5169
				5170	// If this is an indirect operand, store through the pointer after the
				5171	// asm.
				5172	if (OpInfo.isIndirect) {
				5173	IndirectStoresToEmit.push_back(std::make_pair(OpInfo.AssignedRegs,
				5174	OpInfo.CallOperandVal));
				5175	} else {
				5176	// This is the result value of the call.
				5177	assert(CS.getType() != Type::VoidTy && "Bad inline asm!");
				5178	// Concatenate this output onto the outputs list.
				5179	RetValRegs.append(OpInfo.AssignedRegs);
				5180	}
				5181
				5182	// Add information to the INLINEASM node to know that this register is
				5183	// set.
Dale Johannesen	913d3df	2008-09-12 17:49:03 +0000	[diff] [blame]	5184	OpInfo.AssignedRegs.AddInlineAsmOperands(OpInfo.isEarlyClobber ?
				5185	6 /* EARLYCLOBBER REGDEF */ :
				5186	2 /* REGDEF */ ,
				5187	DAG, AsmNodeOperands);
Dan Gohman	f0cbcd4	2008-09-03 16:12:24 +0000	[diff] [blame]	5188	break;
				5189	}
				5190	case InlineAsm::isInput: {
				5191	SDValue InOperandVal = OpInfo.CallOperand;
				5192
Chris Lattner	6bdcda3	2008-10-17 16:47:46 +0000	[diff] [blame]	5193	if (OpInfo.isMatchingInputConstraint()) { // Matching constraint?
Dan Gohman	f0cbcd4	2008-09-03 16:12:24 +0000	[diff] [blame]	5194	// If this is required to match an output register we have already set,
				5195	// just use its register.
Chris Lattner	58f15c4	2008-10-17 16:21:11 +0000	[diff] [blame]	5196	unsigned OperandNo = OpInfo.getMatchedOperand();
Dan Gohman	f0cbcd4	2008-09-03 16:12:24 +0000	[diff] [blame]	5197
				5198	// Scan until we find the definition we already emitted of this operand.
				5199	// When we find it, create a RegsForValue operand.
				5200	unsigned CurOp = 2; // The first operand.
				5201	for (; OperandNo; --OperandNo) {
				5202	// Advance to the next operand.
				5203	unsigned NumOps =
Dan Gohman	f5aeb1a	2008-09-12 16:56:44 +0000	[diff] [blame]	5204	cast<ConstantSDNode>(AsmNodeOperands[CurOp])->getZExtValue();
Dan Gohman	f0cbcd4	2008-09-03 16:12:24 +0000	[diff] [blame]	5205	assert(((NumOps & 7) == 2 /REGDEF/ \|\|
Dale Johannesen	913d3df	2008-09-12 17:49:03 +0000	[diff] [blame]	5206	(NumOps & 7) == 6 /EARLYCLOBBER REGDEF/ \|\|
Dale Johannesen	86b49f8	2008-09-24 01:07:17 +0000	[diff] [blame]	5207	(NumOps & 7) == 4 /MEM/) &&
Dan Gohman	f0cbcd4	2008-09-03 16:12:24 +0000	[diff] [blame]	5208	"Skipped past definitions?");
				5209	CurOp += (NumOps>>3)+1;
				5210	}
				5211
				5212	unsigned NumOps =
Dan Gohman	f5aeb1a	2008-09-12 16:56:44 +0000	[diff] [blame]	5213	cast<ConstantSDNode>(AsmNodeOperands[CurOp])->getZExtValue();
Dale Johannesen	913d3df	2008-09-12 17:49:03 +0000	[diff] [blame]	5214	if ((NumOps & 7) == 2 /REGDEF/
				5215	\|\| (NumOps & 7) == 6 /* EARLYCLOBBER REGDEF */) {
Dan Gohman	f0cbcd4	2008-09-03 16:12:24 +0000	[diff] [blame]	5216	// Add NumOps>>3 registers to MatchedRegs.
				5217	RegsForValue MatchedRegs;
				5218	MatchedRegs.TLI = &TLI;
				5219	MatchedRegs.ValueVTs.push_back(InOperandVal.getValueType());
				5220	MatchedRegs.RegVTs.push_back(AsmNodeOperands[CurOp+1].getValueType());
				5221	for (unsigned i = 0, e = NumOps>>3; i != e; ++i) {
				5222	unsigned Reg =
				5223	cast<RegisterSDNode>(AsmNodeOperands[++CurOp])->getReg();
				5224	MatchedRegs.Regs.push_back(Reg);
				5225	}
				5226
				5227	// Use the produced MatchedRegs object to copy the input into those registers.
				5228	MatchedRegs.getCopyToRegs(InOperandVal, DAG, Chain, &Flag);
Dale Johannesen	86b49f8	2008-09-24 01:07:17 +0000	[diff] [blame]	5229	MatchedRegs.AddInlineAsmOperands(1 /REGUSE/, DAG, AsmNodeOperands);
Dan Gohman	f0cbcd4	2008-09-03 16:12:24 +0000	[diff] [blame]	5230	break;
				5231	} else {
Dale Johannesen	86b49f8	2008-09-24 01:07:17 +0000	[diff] [blame]	5232	assert(((NumOps & 7) == 4) && "Unknown matching constraint!");
Dan Gohman	f0cbcd4	2008-09-03 16:12:24 +0000	[diff] [blame]	5233	assert((NumOps >> 3) == 1 && "Unexpected number of operands");
				5234	// Add information to the INLINEASM node to know about this input.
Dale Johannesen	91aac10	2008-09-17 21:13:11 +0000	[diff] [blame]	5235	AsmNodeOperands.push_back(DAG.getTargetConstant(NumOps,
Dan Gohman	f0cbcd4	2008-09-03 16:12:24 +0000	[diff] [blame]	5236	TLI.getPointerTy()));
				5237	AsmNodeOperands.push_back(AsmNodeOperands[CurOp+1]);
				5238	break;
				5239	}
				5240	}
				5241
				5242	if (OpInfo.ConstraintType == TargetLowering::C_Other) {
				5243	assert(!OpInfo.isIndirect &&
				5244	"Don't know how to handle indirect other inputs yet!");
				5245
				5246	std::vector<SDValue> Ops;
				5247	TLI.LowerAsmOperandForConstraint(InOperandVal, OpInfo.ConstraintCode[0],
Evan Cheng	da43bcf	2008-09-24 00:05:32 +0000	[diff] [blame]	5248	hasMemory, Ops, DAG);
Dan Gohman	f0cbcd4	2008-09-03 16:12:24 +0000	[diff] [blame]	5249	if (Ops.empty()) {
				5250	cerr << "Invalid operand for inline asm constraint '"
				5251	<< OpInfo.ConstraintCode << "'!\n";
				5252	exit(1);
				5253	}
				5254
				5255	// Add information to the INLINEASM node to know about this input.
				5256	unsigned ResOpType = 3 /IMM/ \| (Ops.size() << 3);
				5257	AsmNodeOperands.push_back(DAG.getTargetConstant(ResOpType,
				5258	TLI.getPointerTy()));
				5259	AsmNodeOperands.insert(AsmNodeOperands.end(), Ops.begin(), Ops.end());
				5260	break;
				5261	} else if (OpInfo.ConstraintType == TargetLowering::C_Memory) {
				5262	assert(OpInfo.isIndirect && "Operand must be indirect to be a mem!");
				5263	assert(InOperandVal.getValueType() == TLI.getPointerTy() &&
				5264	"Memory operands expect pointer values");
				5265
				5266	// Add information to the INLINEASM node to know about this input.
Dale Johannesen	86b49f8	2008-09-24 01:07:17 +0000	[diff] [blame]	5267	unsigned ResOpType = 4/MEM/ \| (1<<3);
				5268	AsmNodeOperands.push_back(DAG.getTargetConstant(ResOpType,
Dan Gohman	f0cbcd4	2008-09-03 16:12:24 +0000	[diff] [blame]	5269	TLI.getPointerTy()));
				5270	AsmNodeOperands.push_back(InOperandVal);
				5271	break;
				5272	}
				5273
				5274	assert((OpInfo.ConstraintType == TargetLowering::C_RegisterClass \|\|
				5275	OpInfo.ConstraintType == TargetLowering::C_Register) &&
				5276	"Unknown constraint type!");
				5277	assert(!OpInfo.isIndirect &&
				5278	"Don't know how to handle indirect register inputs yet!");
				5279
				5280	// Copy the input into the appropriate registers.
Evan Cheng	aa765b8	2008-09-25 00:14:04 +0000	[diff] [blame]	5281	if (OpInfo.AssignedRegs.Regs.empty()) {
				5282	cerr << "Couldn't allocate output reg for constraint '"
				5283	<< OpInfo.ConstraintCode << "'!\n";
				5284	exit(1);
				5285	}
Dan Gohman	f0cbcd4	2008-09-03 16:12:24 +0000	[diff] [blame]	5286
				5287	OpInfo.AssignedRegs.getCopyToRegs(InOperandVal, DAG, Chain, &Flag);
				5288
Dale Johannesen	86b49f8	2008-09-24 01:07:17 +0000	[diff] [blame]	5289	OpInfo.AssignedRegs.AddInlineAsmOperands(1/REGUSE/,
				5290	DAG, AsmNodeOperands);
Dan Gohman	f0cbcd4	2008-09-03 16:12:24 +0000	[diff] [blame]	5291	break;
				5292	}
				5293	case InlineAsm::isClobber: {
				5294	// Add the clobbered value to the operand list, so that the register
				5295	// allocator is aware that the physreg got clobbered.
				5296	if (!OpInfo.AssignedRegs.Regs.empty())
Dale Johannesen	91aac10	2008-09-17 21:13:11 +0000	[diff] [blame]	5297	OpInfo.AssignedRegs.AddInlineAsmOperands(6 /* EARLYCLOBBER REGDEF */,
				5298	DAG, AsmNodeOperands);
Dan Gohman	f0cbcd4	2008-09-03 16:12:24 +0000	[diff] [blame]	5299	break;
				5300	}
				5301	}
				5302	}
				5303
				5304	// Finish up input operands.
				5305	AsmNodeOperands[0] = Chain;
				5306	if (Flag.getNode()) AsmNodeOperands.push_back(Flag);
				5307
				5308	Chain = DAG.getNode(ISD::INLINEASM,
				5309	DAG.getNodeValueTypes(MVT::Other, MVT::Flag), 2,
				5310	&AsmNodeOperands[0], AsmNodeOperands.size());
				5311	Flag = Chain.getValue(1);
				5312
				5313	// If this asm returns a register value, copy the result from that register
				5314	// and set it as the value of the call.
				5315	if (!RetValRegs.Regs.empty()) {
				5316	SDValue Val = RetValRegs.getCopyFromRegs(DAG, Chain, &Flag);
Chris Lattner	2a0b96c	2008-10-18 18:49:30 +0000	[diff] [blame]	5317
				5318	// FIXME: Why don't we do this for inline asms with MRVs?
				5319	if (CS.getType()->isSingleValueType() && CS.getType()->isSized()) {
				5320	MVT ResultType = TLI.getValueType(CS.getType());
				5321
				5322	// If any of the results of the inline asm is a vector, it may have the
				5323	// wrong width/num elts. This can happen for register classes that can
				5324	// contain multiple different value types. The preg or vreg allocated may
				5325	// not have the same VT as was expected. Convert it to the right type
				5326	// with bit_convert.
				5327	if (ResultType != Val.getValueType() && Val.getValueType().isVector()) {
				5328	Val = DAG.getNode(ISD::BIT_CONVERT, ResultType, Val);
Dan Gohman	9591573	2008-10-18 01:03:45 +0000	[diff] [blame]	5329
Chris Lattner	2a0b96c	2008-10-18 18:49:30 +0000	[diff] [blame]	5330	} else if (ResultType != Val.getValueType() &&
				5331	ResultType.isInteger() && Val.getValueType().isInteger()) {
				5332	// If a result value was tied to an input value, the computed result may
				5333	// have a wider width than the expected result. Extract the relevant
				5334	// portion.
				5335	Val = DAG.getNode(ISD::TRUNCATE, ResultType, Val);
Dan Gohman	9591573	2008-10-18 01:03:45 +0000	[diff] [blame]	5336	}
Chris Lattner	2a0b96c	2008-10-18 18:49:30 +0000	[diff] [blame]	5337
				5338	assert(ResultType == Val.getValueType() && "Asm result value mismatch!");
Chris Lattner	0c52644	2008-10-17 17:52:49 +0000	[diff] [blame]	5339	}
Dan Gohman	9591573	2008-10-18 01:03:45 +0000	[diff] [blame]	5340
Dan Gohman	f0cbcd4	2008-09-03 16:12:24 +0000	[diff] [blame]	5341	setValue(CS.getInstruction(), Val);
				5342	}
				5343
				5344	std::vector<std::pair<SDValue, Value*> > StoresToEmit;
				5345
				5346	// Process indirect outputs, first output all of the flagged copies out of
				5347	// physregs.
				5348	for (unsigned i = 0, e = IndirectStoresToEmit.size(); i != e; ++i) {
				5349	RegsForValue &OutRegs = IndirectStoresToEmit[i].first;
				5350	Value *Ptr = IndirectStoresToEmit[i].second;
				5351	SDValue OutVal = OutRegs.getCopyFromRegs(DAG, Chain, &Flag);
				5352	StoresToEmit.push_back(std::make_pair(OutVal, Ptr));
				5353	}
				5354
				5355	// Emit the non-flagged stores from the physregs.
				5356	SmallVector<SDValue, 8> OutChains;
				5357	for (unsigned i = 0, e = StoresToEmit.size(); i != e; ++i)
				5358	OutChains.push_back(DAG.getStore(Chain, StoresToEmit[i].first,
				5359	getValue(StoresToEmit[i].second),
				5360	StoresToEmit[i].second, 0));
				5361	if (!OutChains.empty())
				5362	Chain = DAG.getNode(ISD::TokenFactor, MVT::Other,
				5363	&OutChains[0], OutChains.size());
				5364	DAG.setRoot(Chain);
				5365	}
				5366
				5367
				/// visitMalloc - Lower a MallocInst into a C-convention call to the external
				/// symbol "malloc". Operand 0 (the element count) is resized to the target
				/// pointer type, multiplied by the ABI size of the allocated element type,
				/// and passed as the only argument. The call result becomes the value of I
				/// and the call's output chain becomes the new DAG root.
				5368	void SelectionDAGLowering::visitMalloc(MallocInst &I) {
				5369	SDValue Src = getValue(I.getOperand(0));
				5370
				5371	MVT IntPtr = TLI.getPointerTy();
				5372
				// Make the count exactly pointer-sized: truncate when it is wider than a
				// pointer, zero-extend when it is narrower, leave it alone otherwise.
				5373	if (IntPtr.bitsLT(Src.getValueType()))
				5374	Src = DAG.getNode(ISD::TRUNCATE, IntPtr, Src);
				5375	else if (IntPtr.bitsGT(Src.getValueType()))
				5376	Src = DAG.getNode(ISD::ZERO_EXTEND, IntPtr, Src);
				5377
				5378	// Scale the source by the type size.
				5379	uint64_t ElementSize = TD->getABITypeSize(I.getType()->getElementType());
				5380	Src = DAG.getNode(ISD::MUL, Src.getValueType(),
				5381	Src, DAG.getIntPtrConstant(ElementSize));
				5382
				// The byte count is the single call argument, typed as the target's
				// pointer-sized integer.
				5383	TargetLowering::ArgListTy Args;
				5384	TargetLowering::ArgListEntry Entry;
				5385	Entry.Node = Src;
				5386	Entry.Ty = TLI.getTargetData()->getIntPtrType();
				5387	Args.push_back(Entry);
				5388
				// The four false flags are RetSExt, RetZExt, isVarArg and isInreg, in the
				// order declared by TargetLowering::LowerCallTo; PerformTailCallOpt is
				// passed as isTailCall.
				5389	std::pair<SDValue,SDValue> Result =
Dale Johannesen	86098bd	2008-09-26 19:31:26 +0000	[diff] [blame]	5390	TLI.LowerCallTo(getRoot(), I.getType(), false, false, false, false,
				5391	CallingConv::C, PerformTailCallOpt,
				5392	DAG.getExternalSymbol("malloc", IntPtr),
Dan Gohman	1937e2f	2008-09-16 01:42:28 +0000	[diff] [blame]	5393	Args, DAG);
Dan Gohman	f0cbcd4	2008-09-03 16:12:24 +0000	[diff] [blame]	5394	setValue(&I, Result.first); // Pointers always fit in registers
				5395	DAG.setRoot(Result.second);
				5396	}
				5397
				/// visitFree - Lower a FreeInst into a C-convention call to the external
				/// symbol "free", passing operand 0 as the only argument. The call is lowered
				/// with a void return type, so only its output chain is kept, as the new DAG
				/// root.
				5398	void SelectionDAGLowering::visitFree(FreeInst &I) {
				5399	TargetLowering::ArgListTy Args;
				5400	TargetLowering::ArgListEntry Entry;
				5401	Entry.Node = getValue(I.getOperand(0));
				// NOTE(review): the argument is declared with the pointer-sized integer
				// type rather than the operand's own pointer type - presumably equivalent
				// for call lowering; confirm.
				5402	Entry.Ty = TLI.getTargetData()->getIntPtrType();
				5403	Args.push_back(Entry);
				5404	MVT IntPtr = TLI.getPointerTy();
				// The four false flags are RetSExt, RetZExt, isVarArg and isInreg, in the
				// order declared by TargetLowering::LowerCallTo.
				5405	std::pair<SDValue,SDValue> Result =
Dale Johannesen	86098bd	2008-09-26 19:31:26 +0000	[diff] [blame]	5406	TLI.LowerCallTo(getRoot(), Type::VoidTy, false, false, false, false,
Dan Gohman	1937e2f	2008-09-16 01:42:28 +0000	[diff] [blame]	5407	CallingConv::C, PerformTailCallOpt,
Bill Wendling	056292f	2008-09-16 21:48:12 +0000	[diff] [blame]	5408	DAG.getExternalSymbol("free", IntPtr), Args, DAG);
Dan Gohman	f0cbcd4	2008-09-03 16:12:24 +0000	[diff] [blame]	5409	DAG.setRoot(Result.second);
				5410	}
				5411
				/// visitVAStart - Emit an ISD::VASTART node chained on the current root and
				/// install it as the new DAG root. Operand 1 of the call is supplied twice:
				/// once as a DAG value and once wrapped as a SrcValue.
				5412	void SelectionDAGLowering::visitVAStart(CallInst &I) {
				5413	DAG.setRoot(DAG.getNode(ISD::VASTART, MVT::Other, getRoot(),
				5414	getValue(I.getOperand(1)),
				5415	DAG.getSrcValue(I.getOperand(1))));
				5416	}
				5417
				/// visitVAArg - Build a VAArg node whose result type is the value type of I,
				/// chained on the current root and reading from operand 0 (also passed as a
				/// SrcValue). Result 0 of the node becomes the value of I; result 1 becomes
				/// the new DAG root.
				5418	void SelectionDAGLowering::visitVAArg(VAArgInst &I) {
				5419	SDValue V = DAG.getVAArg(TLI.getValueType(I.getType()), getRoot(),
				5420	getValue(I.getOperand(0)),
				5421	DAG.getSrcValue(I.getOperand(0)));
				5422	setValue(&I, V);
				5423	DAG.setRoot(V.getValue(1));
				5424	}
				5425
				/// visitVAEnd - Emit an ISD::VAEND node chained on the current root and
				/// install it as the new DAG root. Operand 1 of the call is supplied both as
				/// a DAG value and as a SrcValue.
				5426	void SelectionDAGLowering::visitVAEnd(CallInst &I) {
				5427	DAG.setRoot(DAG.getNode(ISD::VAEND, MVT::Other, getRoot(),
				5428	getValue(I.getOperand(1)),
				5429	DAG.getSrcValue(I.getOperand(1))));
				5430	}
				5431
				/// visitVACopy - Emit an ISD::VACOPY node chained on the current root and
				/// install it as the new DAG root. Operands 1 and 2 of the call are supplied
				/// first as DAG values and then, in the same order, as SrcValues.
				/// NOTE(review): operand 1 is presumably the destination va_list and operand
				/// 2 the source - confirm against the va_copy intrinsic definition.
				5432	void SelectionDAGLowering::visitVACopy(CallInst &I) {
				5433	DAG.setRoot(DAG.getNode(ISD::VACOPY, MVT::Other, getRoot(),
				5434	getValue(I.getOperand(1)),
				5435	getValue(I.getOperand(2)),
				5436	DAG.getSrcValue(I.getOperand(1)),
				5437	DAG.getSrcValue(I.getOperand(2))));
				5438	}
				5439
				5440	/// TargetLowering::LowerArguments - This is the default LowerArguments
				5441	/// implementation, which just inserts a FORMAL_ARGUMENTS node. FIXME: When all
				5442	/// targets are migrated to using FORMAL_ARGUMENTS, this hook should be
				5443	/// integrated into SDISel.
				///
				/// F is the function whose formal arguments are lowered. The node is built
				/// on the current DAG root, handed to LowerOperation, and the last result of
				/// the lowered node becomes the new DAG root. One SDValue per value of each
				/// formal argument is appended to ArgValues, in argument order.
				5444	void TargetLowering::LowerArguments(Function &F, SelectionDAG &DAG,
				5445	SmallVectorImpl<SDValue> &ArgValues) {
				5446	// Add CC# and isVararg as operands to the FORMAL_ARGUMENTS node.
				5447	SmallVector<SDValue, 3+16> Ops;
				5448	Ops.push_back(DAG.getRoot());
				5449	Ops.push_back(DAG.getConstant(F.getCallingConv(), getPointerTy()));
				5450	Ops.push_back(DAG.getConstant(F.isVarArg(), getPointerTy()));
				5451
				5452	// Add one result value for each formal argument.
				5453	SmallVector<MVT, 16> RetVals;
				// j is the attribute index of the current formal argument; it starts at 1
				// and advances together with the argument iterator.
				5454	unsigned j = 1;
				5455	for (Function::arg_iterator I = F.arg_begin(), E = F.arg_end();
				5456	I != E; ++I, ++j) {
				// An argument may expand to several values; each one gets its own flags.
				5457	SmallVector<MVT, 4> ValueVTs;
				5458	ComputeValueVTs(*this, I->getType(), ValueVTs);
				5459	for (unsigned Value = 0, NumValues = ValueVTs.size();
				5460	Value != NumValues; ++Value) {
				5461	MVT VT = ValueVTs[Value];
				5462	const Type *ArgTy = VT.getTypeForMVT();
				5463	ISD::ArgFlagsTy Flags;
				5464	unsigned OriginalAlignment =
				5465	getTargetData()->getABITypeAlignment(ArgTy);
				5466
				// Mirror the parameter attributes of F into the argument flags.
Devang Patel	0598866	2008-09-25 21:00:45 +0000	[diff] [blame]	5467	if (F.paramHasAttr(j, Attribute::ZExt))
Dan Gohman	f0cbcd4	2008-09-03 16:12:24 +0000	[diff] [blame]	5468	Flags.setZExt();
Devang Patel	0598866	2008-09-25 21:00:45 +0000	[diff] [blame]	5469	if (F.paramHasAttr(j, Attribute::SExt))
Dan Gohman	f0cbcd4	2008-09-03 16:12:24 +0000	[diff] [blame]	5470	Flags.setSExt();
Devang Patel	0598866	2008-09-25 21:00:45 +0000	[diff] [blame]	5471	if (F.paramHasAttr(j, Attribute::InReg))
Dan Gohman	f0cbcd4	2008-09-03 16:12:24 +0000	[diff] [blame]	5472	Flags.setInReg();
Devang Patel	0598866	2008-09-25 21:00:45 +0000	[diff] [blame]	5473	if (F.paramHasAttr(j, Attribute::StructRet))
Dan Gohman	f0cbcd4	2008-09-03 16:12:24 +0000	[diff] [blame]	5474	Flags.setSRet();
Devang Patel	0598866	2008-09-25 21:00:45 +0000	[diff] [blame]	5475	if (F.paramHasAttr(j, Attribute::ByVal)) {
Dan Gohman	f0cbcd4	2008-09-03 16:12:24 +0000	[diff] [blame]	5476	Flags.setByVal();
				5477	const PointerType *Ty = cast<PointerType>(I->getType());
				5478	const Type *ElementTy = Ty->getElementType();
				5479	unsigned FrameAlign = getByValTypeAlignment(ElementTy);
				5480	unsigned FrameSize = getTargetData()->getABITypeSize(ElementTy);
				5481	// For ByVal, alignment should be passed from FE. BE will guess if
				5482	// this info is not there but there are cases it cannot get right.
				5483	if (F.getParamAlignment(j))
				5484	FrameAlign = F.getParamAlignment(j);
				5485	Flags.setByValAlign(FrameAlign);
				5486	Flags.setByValSize(FrameSize);
				5487	}
Devang Patel	0598866	2008-09-25 21:00:45 +0000	[diff] [blame]	5488	if (F.paramHasAttr(j, Attribute::Nest))
Dan Gohman	f0cbcd4	2008-09-03 16:12:24 +0000	[diff] [blame]	5489	Flags.setNest();
				5490	Flags.setOrigAlign(OriginalAlignment);
				5491
				// Emit one result type and one flags operand per register the value
				// occupies. The first of several pieces is marked as split.
				5492	MVT RegisterVT = getRegisterType(VT);
				5493	unsigned NumRegs = getNumRegisters(VT);
				5494	for (unsigned i = 0; i != NumRegs; ++i) {
				5495	RetVals.push_back(RegisterVT);
				5496	ISD::ArgFlagsTy MyFlags = Flags;
				5497	if (NumRegs > 1 && i == 0)
				5498	MyFlags.setSplit();
				5499	// if it isn't first piece, alignment must be 1
				5500	else if (i > 0)
				5501	MyFlags.setOrigAlign(1);
				5502	Ops.push_back(DAG.getArgFlags(MyFlags));
				5503	}
				5504	}
				5505	}
				5506
				// The final result type of the node is MVT::Other.
				5507	RetVals.push_back(MVT::Other);
				5508
				5509	// Create the node.
				5510	SDNode *Result = DAG.getNode(ISD::FORMAL_ARGUMENTS,
				5511	DAG.getVTList(&RetVals[0], RetVals.size()),
				5512	&Ops[0], Ops.size()).getNode();
				5513
				5514	// Prelower FORMAL_ARGUMENTS. This isn't required for functionality, but
				5515	// allows exposing the loads that may be part of the argument access to the
				5516	// first DAGCombiner pass.
				5517	SDValue TmpRes = LowerOperation(SDValue(Result, 0), DAG);
				5518
				5519	// The number of results should match up, except that the lowered one may have
				5520	// an extra flag result.
				5521	assert((Result->getNumValues() == TmpRes.getNode()->getNumValues() ||
				5522	(Result->getNumValues()+1 == TmpRes.getNode()->getNumValues() &&
				5523	TmpRes.getValue(Result->getNumValues()).getValueType() == MVT::Flag))
				5524	&& "Lowering produced unexpected number of results!");
				5525
				5526	// The FORMAL_ARGUMENTS node itself is likely no longer needed.
				5527	if (Result != TmpRes.getNode() && Result->use_empty()) {
				// NOTE(review): the HandleSDNode presumably keeps the current root alive
				// while the dead node is removed - confirm.
				5528	HandleSDNode Dummy(DAG.getRoot());
				5529	DAG.RemoveDeadNode(Result);
				5530	}
				5531
				5532	Result = TmpRes.getNode();
				5533
				// The last value of the lowered node becomes the new root; the values
				// before it are consumed as argument parts below.
				5534	unsigned NumArgRegs = Result->getNumValues() - 1;
				5535	DAG.setRoot(SDValue(Result, NumArgRegs));
				5536
				5537	// Set up the return result vector.
				// i walks the results of the lowered node; Idx is the attribute index of
				// the current formal argument, starting at 1.
				5538	unsigned i = 0;
				5539	unsigned Idx = 1;
				5540	for (Function::arg_iterator I = F.arg_begin(), E = F.arg_end(); I != E;
				5541	++I, ++Idx) {
				5542	SmallVector<MVT, 4> ValueVTs;
				5543	ComputeValueVTs(*this, I->getType(), ValueVTs);
				5544	for (unsigned Value = 0, NumValues = ValueVTs.size();
				5545	Value != NumValues; ++Value) {
				5546	MVT VT = ValueVTs[Value];
				5547	MVT PartVT = getRegisterType(VT);
				5548
				// Collect the consecutive node results that make up this value.
				5549	unsigned NumParts = getNumRegisters(VT);
				5550	SmallVector<SDValue, 4> Parts(NumParts);
				5551	for (unsigned j = 0; j != NumParts; ++j)
				5552	Parts[j] = SDValue(Result, i++);
				5553
				// SExt takes precedence over ZExt when choosing the assertion node.
				5554	ISD::NodeType AssertOp = ISD::DELETED_NODE;
Devang Patel	0598866	2008-09-25 21:00:45 +0000	[diff] [blame]	5555	if (F.paramHasAttr(Idx, Attribute::SExt))
Dan Gohman	f0cbcd4	2008-09-03 16:12:24 +0000	[diff] [blame]	5556	AssertOp = ISD::AssertSext;
Devang Patel	0598866	2008-09-25 21:00:45 +0000	[diff] [blame]	5557	else if (F.paramHasAttr(Idx, Attribute::ZExt))
Dan Gohman	f0cbcd4	2008-09-03 16:12:24 +0000	[diff] [blame]	5558	AssertOp = ISD::AssertZext;
				5559
				5560	ArgValues.push_back(getCopyFromParts(DAG, &Parts[0], NumParts, PartVT, VT,
				5561	AssertOp));
				5562	}
				5563	}
				5564	assert(i == NumArgRegs && "Argument register count mismatch!");
				5565	}
				5566
				5567
				5568	/// TargetLowering::LowerCallTo - This is the default LowerCallTo
				5569	/// implementation, which just inserts an ISD::CALL node, which is later custom
				5570	/// lowered by the target to something concrete. FIXME: When all targets are
				5571	/// migrated to using ISD::CALL, this hook should be integrated into SDISel.
				///
				/// The operand list is the chain, the callee, and then a (part, flags) pair
				/// for every register-sized piece of every argument in Args. The returned
				/// pair is (result, output chain): for a non-void RetTy with at least one
				/// value the result is a MERGE_VALUES of the reassembled return values,
				/// otherwise it is the call node itself.
				5572	std::pair<SDValue, SDValue>
				5573	TargetLowering::LowerCallTo(SDValue Chain, const Type *RetTy,
				5574	bool RetSExt, bool RetZExt, bool isVarArg,
Dale Johannesen	86098bd	2008-09-26 19:31:26 +0000	[diff] [blame]	5575	bool isInreg,
Dan Gohman	f0cbcd4	2008-09-03 16:12:24 +0000	[diff] [blame]	5576	unsigned CallingConv, bool isTailCall,
				5577	SDValue Callee,
				5578	ArgListTy &Args, SelectionDAG &DAG) {
Dan Gohman	1937e2f	2008-09-16 01:42:28 +0000	[diff] [blame]	5579	assert((!isTailCall || PerformTailCallOpt) &&
				5580	"isTailCall set when tail-call optimizations are disabled!");
				5581
Dan Gohman	f0cbcd4	2008-09-03 16:12:24 +0000	[diff] [blame]	5582	SmallVector<SDValue, 32> Ops;
				5583	Ops.push_back(Chain); // Op#0 - Chain
Dan Gohman	f0cbcd4	2008-09-03 16:12:24 +0000	[diff] [blame]	5584	Ops.push_back(Callee);
				5585
				5586	// Handle all of the outgoing arguments.
				5587	for (unsigned i = 0, e = Args.size(); i != e; ++i) {
				// An argument may expand to several values; each is handled separately.
				5588	SmallVector<MVT, 4> ValueVTs;
				5589	ComputeValueVTs(*this, Args[i].Ty, ValueVTs);
				5590	for (unsigned Value = 0, NumValues = ValueVTs.size();
				5591	Value != NumValues; ++Value) {
				5592	MVT VT = ValueVTs[Value];
				5593	const Type *ArgTy = VT.getTypeForMVT();
				// Select result number (ResNo + Value) of the node that produces the
				// argument.
Chris Lattner	2a0b96c	2008-10-18 18:49:30 +0000	[diff] [blame]	5594	SDValue Op = SDValue(Args[i].Node.getNode(),
				5595	Args[i].Node.getResNo() + Value);
Dan Gohman	f0cbcd4	2008-09-03 16:12:24 +0000	[diff] [blame]	5596	ISD::ArgFlagsTy Flags;
				5597	unsigned OriginalAlignment =
				5598	getTargetData()->getABITypeAlignment(ArgTy);
				5599
				// Mirror the ArgListEntry attributes into the argument flags.
				5600	if (Args[i].isZExt)
				5601	Flags.setZExt();
				5602	if (Args[i].isSExt)
				5603	Flags.setSExt();
				5604	if (Args[i].isInReg)
				5605	Flags.setInReg();
				5606	if (Args[i].isSRet)
				5607	Flags.setSRet();
				5608	if (Args[i].isByVal) {
				5609	Flags.setByVal();
				5610	const PointerType *Ty = cast<PointerType>(Args[i].Ty);
				5611	const Type *ElementTy = Ty->getElementType();
				5612	unsigned FrameAlign = getByValTypeAlignment(ElementTy);
				5613	unsigned FrameSize = getTargetData()->getABITypeSize(ElementTy);
				5614	// For ByVal, alignment should come from FE. BE will guess if this
				5615	// info is not there but there are cases it cannot get right.
				5616	if (Args[i].Alignment)
				5617	FrameAlign = Args[i].Alignment;
				5618	Flags.setByValAlign(FrameAlign);
				5619	Flags.setByValSize(FrameSize);
				5620	}
				5621	if (Args[i].isNest)
				5622	Flags.setNest();
				5623	Flags.setOrigAlign(OriginalAlignment);
				5624
				// Split the value into register-sized parts. The extension kind defaults
				// to ANY_EXTEND, with SExt taking precedence over ZExt.
				5625	MVT PartVT = getRegisterType(VT);
				5626	unsigned NumParts = getNumRegisters(VT);
				5627	SmallVector<SDValue, 4> Parts(NumParts);
				5628	ISD::NodeType ExtendKind = ISD::ANY_EXTEND;
				5629
				5630	if (Args[i].isSExt)
				5631	ExtendKind = ISD::SIGN_EXTEND;
				5632	else if (Args[i].isZExt)
				5633	ExtendKind = ISD::ZERO_EXTEND;
				5634
				5635	getCopyToParts(DAG, Op, &Parts[0], NumParts, PartVT, ExtendKind);
				5636
				// Note: this i shadows the argument index of the outer loop; inside this
				// loop it indexes Parts only.
				5637	for (unsigned i = 0; i != NumParts; ++i) {
				5638	// if it isn't first piece, alignment must be 1
				5639	ISD::ArgFlagsTy MyFlags = Flags;
				5640	if (NumParts > 1 && i == 0)
				5641	MyFlags.setSplit();
				5642	else if (i != 0)
				5643	MyFlags.setOrigAlign(1);
				5644
				5645	Ops.push_back(Parts[i]);
				5646	Ops.push_back(DAG.getArgFlags(MyFlags));
				5647	}
				5648	}
				5649	}
				5650
				5651	// Figure out the result value types. We start by making a list of
				5652	// the potentially illegal return value types.
				5653	SmallVector<MVT, 4> LoweredRetTys;
				5654	SmallVector<MVT, 4> RetTys;
				5655	ComputeValueVTs(*this, RetTy, RetTys);
				5656
				5657	// Then we translate that to a list of legal types.
				5658	for (unsigned I = 0, E = RetTys.size(); I != E; ++I) {
				5659	MVT VT = RetTys[I];
				5660	MVT RegisterVT = getRegisterType(VT);
				5661	unsigned NumRegs = getNumRegisters(VT);
				5662	for (unsigned i = 0; i != NumRegs; ++i)
				5663	LoweredRetTys.push_back(RegisterVT);
				5664	}
				5665
				5666	LoweredRetTys.push_back(MVT::Other); // Always has a chain.
				5667
				5668	// Create the CALL node.
Dale Johannesen	86098bd	2008-09-26 19:31:26 +0000	[diff] [blame]	5669	SDValue Res = DAG.getCall(CallingConv, isVarArg, isTailCall, isInreg,
Dan Gohman	095cc29	2008-09-13 01:54:27 +0000	[diff] [blame]	5670	DAG.getVTList(&LoweredRetTys[0],
				5671	LoweredRetTys.size()),
Dale Johannesen	86098bd	2008-09-26 19:31:26 +0000	[diff] [blame]	5672	&Ops[0], Ops.size()
				5673	);
				// The chain is the last result of the call node.
Dan Gohman	f0cbcd4	2008-09-03 16:12:24 +0000	[diff] [blame]	5674	Chain = Res.getValue(LoweredRetTys.size() - 1);
				5675
				5676	// Gather up the call result into a single value.
Dan Gohman	b5cc34d	2008-10-07 00:12:37 +0000	[diff] [blame]	5677	if (RetTy != Type::VoidTy && !RetTys.empty()) {
Dan Gohman	f0cbcd4	2008-09-03 16:12:24 +0000	[diff] [blame]	5678	ISD::NodeType AssertOp = ISD::DELETED_NODE;
				5679
				5680	if (RetSExt)
				5681	AssertOp = ISD::AssertSext;
				5682	else if (RetZExt)
				5683	AssertOp = ISD::AssertZext;
				5684
				// RegNo walks the register-typed results of the call; each return value
				// is rebuilt from its NumRegs consecutive results.
				5685	SmallVector<SDValue, 4> ReturnValues;
				5686	unsigned RegNo = 0;
				5687	for (unsigned I = 0, E = RetTys.size(); I != E; ++I) {
				5688	MVT VT = RetTys[I];
				5689	MVT RegisterVT = getRegisterType(VT);
				5690	unsigned NumRegs = getNumRegisters(VT);
				5691	unsigned RegNoEnd = NumRegs + RegNo;
				5692	SmallVector<SDValue, 4> Results;
				5693	for (; RegNo != RegNoEnd; ++RegNo)
				5694	Results.push_back(Res.getValue(RegNo));
				5695	SDValue ReturnValue =
				5696	getCopyFromParts(DAG, &Results[0], NumRegs, RegisterVT, VT,
				5697	AssertOp);
				5698	ReturnValues.push_back(ReturnValue);
				5699	}
Duncan Sands	aaffa05	2008-12-01 11:41:29 +0000	[diff] [blame]	5700	Res = DAG.getNode(ISD::MERGE_VALUES,
				5701	DAG.getVTList(&RetTys[0], RetTys.size()),
				5702	&ReturnValues[0], ReturnValues.size());
Dan Gohman	f0cbcd4	2008-09-03 16:12:24 +0000	[diff] [blame]	5703	}
				5704
				5705	return std::make_pair(Res, Chain);
				5706	}
				5707
				/// LowerOperation - Fallback implementation: asserts and then aborts, since
				/// reaching it means the target did not provide its own lowering.
				/// NOTE(review): presumably targets override this hook - confirm against the
				/// TargetLowering class declaration.
				5708	SDValue TargetLowering::LowerOperation(SDValue Op, SelectionDAG &DAG) {
				5709	assert(0 && "LowerOperation not implemented for this target!");
				// abort() still stops the program when the assert is compiled out.
				5710	abort();
				// Not reached; presumably present only to satisfy the return type.
				5711	return SDValue();
				5712	}
				5713
				5714
				/// CopyValueToVirtualRegister - Emit copies of the DAG value of V into the
				/// virtual register Reg, through a RegsForValue built from Reg and the type
				/// of V. The copies are chained from the DAG entry node and the resulting
				/// chain is queued on PendingExports. Reg must not be a physical register.
				5715	void SelectionDAGLowering::CopyValueToVirtualRegister(Value *V, unsigned Reg) {
				5716	SDValue Op = getValue(V);
				// Reject a copy whose source is a CopyFromReg of the very same register.
				5717	assert((Op.getOpcode() != ISD::CopyFromReg ||
				5718	cast<RegisterSDNode>(Op.getOperand(1))->getReg() != Reg) &&
				5719	"Copy from a reg to the same reg!");
				5720	assert(!TargetRegisterInfo::isPhysicalRegister(Reg) && "Is a physreg");
				5721
				5722	RegsForValue RFV(TLI, Reg, V->getType());
				5723	SDValue Chain = DAG.getEntryNode();
				// Chain is passed by name and pushed afterwards; presumably getCopyToRegs
				// updates it to the chain of the emitted copies - confirm. The final 0 is
				// the flag argument (no flag is used).
				5724	RFV.getCopyToRegs(Op, DAG, Chain, 0);
				5725	PendingExports.push_back(Chain);
				5726	}
				5727
				5728	#include "llvm/CodeGen/SelectionDAGISel.h"
				5729
				/// LowerArguments - Lower the formal arguments of the function containing
				/// LLVMBB through TLI.LowerArguments, bind each used argument to its DAG
				/// value, copy arguments that have an entry in FuncInfo->ValueMap into their
				/// virtual registers, and finally call EmitFunctionEntryCode.
				5730	void SelectionDAGISel::
				5731	LowerArguments(BasicBlock *LLVMBB) {
				5732	// If this is the entry block, emit arguments.
				5733	Function &F = *LLVMBB->getParent();
				// NOTE(review): OldRoot is not referenced again in this function.
				5734	SDValue OldRoot = SDL->DAG.getRoot();
				5735	SmallVector<SDValue, 16> Args;
				5736	TLI.LowerArguments(F, SDL->DAG, Args);
				5737
				// a indexes Args; every argument consumes one entry per value of its type,
				// whether or not the argument is used.
				5738	unsigned a = 0;
				5739	for (Function::arg_iterator AI = F.arg_begin(), E = F.arg_end();
				5740	AI != E; ++AI) {
				5741	SmallVector<MVT, 4> ValueVTs;
				5742	ComputeValueVTs(TLI, AI->getType(), ValueVTs);
				5743	unsigned NumValues = ValueVTs.size();
				5744	if (!AI->use_empty()) {
				5745	SDL->setValue(AI, SDL->DAG.getMergeValues(&Args[a], NumValues));
				5746	// If this argument is live outside of the entry block, insert a copy from
				5747	// wherever we got it to the vreg that other BB's will reference it as.
				5748	DenseMap<const Value*, unsigned>::iterator VMI=FuncInfo->ValueMap.find(AI);
				5749	if (VMI != FuncInfo->ValueMap.end()) {
				5750	SDL->CopyValueToVirtualRegister(AI, VMI->second);
				5751	}
				5752	}
				5753	a += NumValues;
				5754	}
				5755
				5756	// Finally, if the target has anything special to do, allow it to do so.
				5757	// FIXME: this should insert code into the DAG!
				5758	EmitFunctionEntryCode(F, SDL->DAG.getMachineFunction());
				5759	}
				5760
				5761	/// Handle PHI nodes in successor blocks. Emit code into the SelectionDAG to
				5762	/// ensure constants are generated when needed. Remember the virtual registers
				5763	/// that need to be added to the Machine PHI nodes as input. We cannot just
				5764	/// directly add them, because expansion might result in multiple MBB's for one
				5765	/// BB. As such, the start of the BB might correspond to a different MBB than
				5766	/// the end.
				5767	///
				/// The (machine instruction, register) pairs are appended to
				/// SDL->PHINodesToUpdate, and SDL->ConstantsOut is cleared on exit.
				5768	void
				5769	SelectionDAGISel::HandlePHINodesInSuccessorBlocks(BasicBlock *LLVMBB) {
				5770	TerminatorInst *TI = LLVMBB->getTerminator();
				5771
				5772	SmallPtrSet<MachineBasicBlock *, 4> SuccsHandled;
				5773
				5774	// Check successor nodes' PHI nodes that expect a constant to be available
				5775	// from this block.
				5776	for (unsigned succ = 0, e = TI->getNumSuccessors(); succ != e; ++succ) {
				5777	BasicBlock *SuccBB = TI->getSuccessor(succ);
				// Skip successors that do not begin with a PHI node.
				5778	if (!isa<PHINode>(SuccBB->begin())) continue;
				5779	MachineBasicBlock *SuccMBB = FuncInfo->MBBMap[SuccBB];
				5780
				5781	// If this terminator has multiple identical successors (common for
				5782	// switches), only handle each succ once.
				5783	if (!SuccsHandled.insert(SuccMBB)) continue;
				5784
				5785	MachineBasicBlock::iterator MBBI = SuccMBB->begin();
				5786	PHINode *PN;
				5787
				5788	// At this point we know that there is a 1-1 correspondence between LLVM PHI
				5789	// nodes and Machine PHI nodes, but the incoming operands have not been
				5790	// emitted yet.
				5791	for (BasicBlock::iterator I = SuccBB->begin();
				5792	(PN = dyn_cast<PHINode>(I)); ++I) {
				5793	// Ignore dead phi's.
				5794	if (PN->use_empty()) continue;
				5795
				5796	unsigned Reg;
				5797	Value *PHIOp = PN->getIncomingValueForBlock(LLVMBB);
				5798
				5799	if (Constant *C = dyn_cast<Constant>(PHIOp)) {
				// ConstantsOut caches the vreg created for each constant, so a constant
				// is copied into a register at most once per call.
				5800	unsigned &RegOut = SDL->ConstantsOut[C];
				5801	if (RegOut == 0) {
				5802	RegOut = FuncInfo->CreateRegForValue(C);
				5803	SDL->CopyValueToVirtualRegister(C, RegOut);
				5804	}
				5805	Reg = RegOut;
				5806	} else {
				5807	Reg = FuncInfo->ValueMap[PHIOp];
				// A non-constant operand without a register is asserted to be a static
				// alloca; a register is created and filled for it here.
				5808	if (Reg == 0) {
				5809	assert(isa<AllocaInst>(PHIOp) &&
				5810	FuncInfo->StaticAllocaMap.count(cast<AllocaInst>(PHIOp)) &&
				5811	"Didn't codegen value into a register!??");
				5812	Reg = FuncInfo->CreateRegForValue(PHIOp);
				5813	SDL->CopyValueToVirtualRegister(PHIOp, Reg);
				5814	}
				5815	}
				5816
				5817	// Remember that this register needs to be added to the machine PHI node as
				5818	// the input for this MBB.
				5819	SmallVector<MVT, 4> ValueVTs;
				5820	ComputeValueVTs(TLI, PN->getType(), ValueVTs);
				// Each value type covers NumRegisters consecutive registers; every one is
				// paired with the next instruction at the head of SuccMBB.
				5821	for (unsigned vti = 0, vte = ValueVTs.size(); vti != vte; ++vti) {
				5822	MVT VT = ValueVTs[vti];
				5823	unsigned NumRegisters = TLI.getNumRegisters(VT);
				5824	for (unsigned i = 0, e = NumRegisters; i != e; ++i)
				5825	SDL->PHINodesToUpdate.push_back(std::make_pair(MBBI++, Reg+i));
				5826	Reg += NumRegisters;
				5827	}
				5828	}
				5829	}
				5830	SDL->ConstantsOut.clear();
Dan Gohman	f0cbcd4	2008-09-03 16:12:24 +0000	[diff] [blame]	5831	}
				5832
Dan Gohman	3df24e6	2008-09-03 23:12:08 +0000	[diff] [blame]	5833	/// This is the Fast-ISel version of HandlePHINodesInSuccessorBlocks. It only
				5834	/// supports legal types, and it emits MachineInstrs directly instead of
				5835	/// creating SelectionDAG nodes.
				5836	///
				/// Returns true when every live PHI in every successor was handled. On the
				/// first PHI that cannot be handled it truncates SDL->PHINodesToUpdate back
				/// to the size it had on entry and returns false.
				5837	bool
				5838	SelectionDAGISel::HandlePHINodesInSuccessorBlocksFast(BasicBlock *LLVMBB,
				5839	FastISel *F) {
				5840	TerminatorInst *TI = LLVMBB->getTerminator();
Dan Gohman	f0cbcd4	2008-09-03 16:12:24 +0000	[diff] [blame]	5841
Dan Gohman	3df24e6	2008-09-03 23:12:08 +0000	[diff] [blame]	5842	SmallPtrSet<MachineBasicBlock *, 4> SuccsHandled;
				// Remember the entry size so a failure can undo the entries added here.
				5843	unsigned OrigNumPHINodesToUpdate = SDL->PHINodesToUpdate.size();
				5844
				5845	// Check successor nodes' PHI nodes that expect a constant to be available
				5846	// from this block.
				5847	for (unsigned succ = 0, e = TI->getNumSuccessors(); succ != e; ++succ) {
				5848	BasicBlock *SuccBB = TI->getSuccessor(succ);
				// Skip successors that do not begin with a PHI node.
				5849	if (!isa<PHINode>(SuccBB->begin())) continue;
				5850	MachineBasicBlock *SuccMBB = FuncInfo->MBBMap[SuccBB];
				5851
				5852	// If this terminator has multiple identical successors (common for
				5853	// switches), only handle each succ once.
				5854	if (!SuccsHandled.insert(SuccMBB)) continue;
				5855
				5856	MachineBasicBlock::iterator MBBI = SuccMBB->begin();
				5857	PHINode *PN;
				5858
				5859	// At this point we know that there is a 1-1 correspondence between LLVM PHI
				5860	// nodes and Machine PHI nodes, but the incoming operands have not been
				5861	// emitted yet.
				5862	for (BasicBlock::iterator I = SuccBB->begin();
				5863	(PN = dyn_cast<PHINode>(I)); ++I) {
				5864	// Ignore dead phi's.
				5865	if (PN->use_empty()) continue;
				5866
				5867	// Only handle legal types. Two interesting things to note here. First,
				5868	// by bailing out early, we may leave behind some dead instructions,
				5869	// since SelectionDAG's HandlePHINodesInSuccessorBlocks will insert its
				5870	// own moves. Second, this check is necessary because FastISel doesn't
				5871	// use CreateRegForValue to create registers, so it always creates
				5872	// exactly one register for each non-void instruction.
				5873	MVT VT = TLI.getValueType(PN->getType(), /*AllowUnknown=*/true);
				5874	if (VT == MVT::Other || !TLI.isTypeLegal(VT)) {
Dan Gohman	74321ab	2008-09-10 21:01:31 +0000	[diff] [blame]	5875	// Promote MVT::i1.
				5876	if (VT == MVT::i1)
				5877	VT = TLI.getTypeToTransformTo(VT);
				5878	else {
				5879	SDL->PHINodesToUpdate.resize(OrigNumPHINodesToUpdate);
				5880	return false;
				5881	}
Dan Gohman	3df24e6	2008-09-03 23:12:08 +0000	[diff] [blame]	5882	}
				5883
				5884	Value *PHIOp = PN->getIncomingValueForBlock(LLVMBB);
				5885
				// A zero register means FastISel could not provide the operand; undo and
				// report failure.
				5886	unsigned Reg = F->getRegForValue(PHIOp);
				5887	if (Reg == 0) {
				5888	SDL->PHINodesToUpdate.resize(OrigNumPHINodesToUpdate);
				5889	return false;
				5890	}
				5891	SDL->PHINodesToUpdate.push_back(std::make_pair(MBBI++, Reg));
				5892	}
				5893	}
				5894
				5895	return true;
				5896	}