Blame - lib/CodeGen/SelectionDAG/SelectionDAGBuild.cpp - platform/external/llvm

blob: c7e2cd5caba4bda29cfe2d422672741d523697b8 [file] [log] [blame]

Dan Gohman	f0cbcd4	2008-09-03 16:12:24 +0000	[diff] [blame]	1	//===-- SelectionDAGBuild.cpp - Selection-DAG building --------------------===//
				2	//
				3	// The LLVM Compiler Infrastructure
				4	//
				5	// This file is distributed under the University of Illinois Open Source
				6	// License. See LICENSE.TXT for details.
				7	//
				8	//===----------------------------------------------------------------------===//
				9	//
				10	// This implements routines for translating from LLVM IR into SelectionDAG IR.
				11	//
				12	//===----------------------------------------------------------------------===//
				13
				14	#define DEBUG_TYPE "isel"
				15	#include "SelectionDAGBuild.h"
				16	#include "llvm/ADT/BitVector.h"
Dan Gohman	5b22980	2008-09-04 20:49:27 +0000	[diff] [blame]	17	#include "llvm/ADT/SmallSet.h"
Dan Gohman	f0cbcd4	2008-09-03 16:12:24 +0000	[diff] [blame]	18	#include "llvm/Analysis/AliasAnalysis.h"
				19	#include "llvm/Constants.h"
				20	#include "llvm/CallingConv.h"
				21	#include "llvm/DerivedTypes.h"
				22	#include "llvm/Function.h"
				23	#include "llvm/GlobalVariable.h"
				24	#include "llvm/InlineAsm.h"
				25	#include "llvm/Instructions.h"
				26	#include "llvm/Intrinsics.h"
				27	#include "llvm/IntrinsicInst.h"
				28	#include "llvm/ParameterAttributes.h"
				29	#include "llvm/CodeGen/FastISel.h"
				30	#include "llvm/CodeGen/GCStrategy.h"
				31	#include "llvm/CodeGen/GCMetadata.h"
				32	#include "llvm/CodeGen/MachineFunction.h"
				33	#include "llvm/CodeGen/MachineFrameInfo.h"
				34	#include "llvm/CodeGen/MachineInstrBuilder.h"
				35	#include "llvm/CodeGen/MachineJumpTableInfo.h"
				36	#include "llvm/CodeGen/MachineModuleInfo.h"
				37	#include "llvm/CodeGen/MachineRegisterInfo.h"
				38	#include "llvm/CodeGen/SelectionDAG.h"
				39	#include "llvm/Target/TargetRegisterInfo.h"
				40	#include "llvm/Target/TargetData.h"
				41	#include "llvm/Target/TargetFrameInfo.h"
				42	#include "llvm/Target/TargetInstrInfo.h"
				43	#include "llvm/Target/TargetLowering.h"
				44	#include "llvm/Target/TargetMachine.h"
				45	#include "llvm/Target/TargetOptions.h"
				46	#include "llvm/Support/Compiler.h"
				47	#include "llvm/Support/Debug.h"
				48	#include "llvm/Support/MathExtras.h"
				49	#include <algorithm>
				50	using namespace llvm;
				51
Dale Johannesen	601d3c0	2008-09-05 01:48:15 +0000	[diff] [blame]	52	/// LimitFloatPrecision - Generate low-precision inline sequences for
				53	/// some float libcalls (6, 8 or 12 bits).
				54	static unsigned LimitFloatPrecision;
				55
				56	static cl::opt<unsigned, true>
				57	LimitFPPrecision("limit-float-precision",
				58	cl::desc("Generate low-precision inline sequences "
				59	"for some float libcalls"),
				60	cl::location(LimitFloatPrecision),
				61	cl::init(0));
				62
Dan Gohman	f0cbcd4	2008-09-03 16:12:24 +0000	[diff] [blame]	63	/// ComputeLinearIndex - Given an LLVM IR aggregate type and a sequence
				64	/// insertvalue or extractvalue indices that identify a member, return
				65	/// the linearized index of the start of the member.
				66	///
				67	static unsigned ComputeLinearIndex(const TargetLowering &TLI, const Type *Ty,
				68	const unsigned *Indices,
				69	const unsigned *IndicesEnd,
				70	unsigned CurIndex = 0) {
				71	// Base case: We're done.
				72	if (Indices && Indices == IndicesEnd)
				73	return CurIndex;
				74
				75	// Given a struct type, recursively traverse the elements.
				76	if (const StructType *STy = dyn_cast<StructType>(Ty)) {
				77	for (StructType::element_iterator EB = STy->element_begin(),
				78	EI = EB,
				79	EE = STy->element_end();
				80	EI != EE; ++EI) {
				81	if (Indices && *Indices == unsigned(EI - EB))
				82	return ComputeLinearIndex(TLI, *EI, Indices+1, IndicesEnd, CurIndex);
				83	CurIndex = ComputeLinearIndex(TLI, *EI, 0, 0, CurIndex);
				84	}
				85	}
				86	// Given an array type, recursively traverse the elements.
				87	else if (const ArrayType *ATy = dyn_cast<ArrayType>(Ty)) {
				88	const Type *EltTy = ATy->getElementType();
				89	for (unsigned i = 0, e = ATy->getNumElements(); i != e; ++i) {
				90	if (Indices && *Indices == i)
				91	return ComputeLinearIndex(TLI, EltTy, Indices+1, IndicesEnd, CurIndex);
				92	CurIndex = ComputeLinearIndex(TLI, EltTy, 0, 0, CurIndex);
				93	}
				94	}
				95	// We haven't found the type we're looking for, so keep searching.
				96	return CurIndex + 1;
				97	}
				98
				99	/// ComputeValueVTs - Given an LLVM IR type, compute a sequence of
				100	/// MVTs that represent all the individual underlying
				101	/// non-aggregate types that comprise it.
				102	///
				103	/// If Offsets is non-null, it points to a vector to be filled in
				104	/// with the in-memory offsets of each of the individual values.
				105	///
				106	static void ComputeValueVTs(const TargetLowering &TLI, const Type *Ty,
				107	SmallVectorImpl<MVT> &ValueVTs,
				108	SmallVectorImpl<uint64_t> *Offsets = 0,
				109	uint64_t StartingOffset = 0) {
				110	// Given a struct type, recursively traverse the elements.
				111	if (const StructType *STy = dyn_cast<StructType>(Ty)) {
				112	const StructLayout *SL = TLI.getTargetData()->getStructLayout(STy);
				113	for (StructType::element_iterator EB = STy->element_begin(),
				114	EI = EB,
				115	EE = STy->element_end();
				116	EI != EE; ++EI)
				117	ComputeValueVTs(TLI, *EI, ValueVTs, Offsets,
				118	StartingOffset + SL->getElementOffset(EI - EB));
				119	return;
				120	}
				121	// Given an array type, recursively traverse the elements.
				122	if (const ArrayType *ATy = dyn_cast<ArrayType>(Ty)) {
				123	const Type *EltTy = ATy->getElementType();
				124	uint64_t EltSize = TLI.getTargetData()->getABITypeSize(EltTy);
				125	for (unsigned i = 0, e = ATy->getNumElements(); i != e; ++i)
				126	ComputeValueVTs(TLI, EltTy, ValueVTs, Offsets,
				127	StartingOffset + i * EltSize);
				128	return;
				129	}
				130	// Base case: we can get an MVT for this LLVM IR type.
				131	ValueVTs.push_back(TLI.getValueType(Ty));
				132	if (Offsets)
				133	Offsets->push_back(StartingOffset);
				134	}
				135
Dan Gohman	2a7c671	2008-09-03 23:18:39 +0000	[diff] [blame]	136	namespace llvm {
Dan Gohman	f0cbcd4	2008-09-03 16:12:24 +0000	[diff] [blame]	137	/// RegsForValue - This struct represents the registers (physical or virtual)
				138	/// that a particular set of values is assigned, and the type information about
				139	/// the value. The most common situation is to represent one value at a time,
				140	/// but struct or array values are handled element-wise as multiple values.
				141	/// The splitting of aggregates is performed recursively, so that we never
				142	/// have aggregate-typed registers. The values at this point do not necessarily
				143	/// have legal types, so each value may require one or more registers of some
				144	/// legal type.
				145	///
				146	struct VISIBILITY_HIDDEN RegsForValue {
				147	/// TLI - The TargetLowering object.
				148	///
				149	const TargetLowering *TLI;
				150
				151	/// ValueVTs - The value types of the values, which may not be legal, and
				152	/// may need be promoted or synthesized from one or more registers.
				153	///
				154	SmallVector<MVT, 4> ValueVTs;
				155
				156	/// RegVTs - The value types of the registers. This is the same size as
				157	/// ValueVTs and it records, for each value, what the type of the assigned
				158	/// register or registers are. (Individual values are never synthesized
				159	/// from more than one type of register.)
				160	///
				161	/// With virtual registers, the contents of RegVTs is redundant with TLI's
				162	/// getRegisterType member function, however when with physical registers
				163	/// it is necessary to have a separate record of the types.
				164	///
				165	SmallVector<MVT, 4> RegVTs;
				166
				167	/// Regs - This list holds the registers assigned to the values.
				168	/// Each legal or promoted value requires one register, and each
				169	/// expanded value requires multiple registers.
				170	///
				171	SmallVector<unsigned, 4> Regs;
				172
				173	RegsForValue() : TLI(0) {}
				174
				175	RegsForValue(const TargetLowering &tli,
				176	const SmallVector<unsigned, 4> &regs,
				177	MVT regvt, MVT valuevt)
				178	: TLI(&tli), ValueVTs(1, valuevt), RegVTs(1, regvt), Regs(regs) {}
				179	RegsForValue(const TargetLowering &tli,
				180	const SmallVector<unsigned, 4> &regs,
				181	const SmallVector<MVT, 4> &regvts,
				182	const SmallVector<MVT, 4> &valuevts)
				183	: TLI(&tli), ValueVTs(valuevts), RegVTs(regvts), Regs(regs) {}
				184	RegsForValue(const TargetLowering &tli,
				185	unsigned Reg, const Type *Ty) : TLI(&tli) {
				186	ComputeValueVTs(tli, Ty, ValueVTs);
				187
				188	for (unsigned Value = 0, e = ValueVTs.size(); Value != e; ++Value) {
				189	MVT ValueVT = ValueVTs[Value];
				190	unsigned NumRegs = TLI->getNumRegisters(ValueVT);
				191	MVT RegisterVT = TLI->getRegisterType(ValueVT);
				192	for (unsigned i = 0; i != NumRegs; ++i)
				193	Regs.push_back(Reg + i);
				194	RegVTs.push_back(RegisterVT);
				195	Reg += NumRegs;
				196	}
				197	}
				198
				199	/// append - Add the specified values to this one.
				200	void append(const RegsForValue &RHS) {
				201	TLI = RHS.TLI;
				202	ValueVTs.append(RHS.ValueVTs.begin(), RHS.ValueVTs.end());
				203	RegVTs.append(RHS.RegVTs.begin(), RHS.RegVTs.end());
				204	Regs.append(RHS.Regs.begin(), RHS.Regs.end());
				205	}
				206
				207
				208	/// getCopyFromRegs - Emit a series of CopyFromReg nodes that copies from
				209	/// this value and returns the result as a ValueVTs value. This uses
				210	/// Chain/Flag as the input and updates them for the output Chain/Flag.
				211	/// If the Flag pointer is NULL, no flag is used.
				212	SDValue getCopyFromRegs(SelectionDAG &DAG,
				213	SDValue &Chain, SDValue *Flag) const;
				214
				215	/// getCopyToRegs - Emit a series of CopyToReg nodes that copies the
				216	/// specified value into the registers specified by this object. This uses
				217	/// Chain/Flag as the input and updates them for the output Chain/Flag.
				218	/// If the Flag pointer is NULL, no flag is used.
				219	void getCopyToRegs(SDValue Val, SelectionDAG &DAG,
				220	SDValue &Chain, SDValue *Flag) const;
				221
				222	/// AddInlineAsmOperands - Add this value to the specified inlineasm node
				223	/// operand list. This adds the code marker and includes the number of
				224	/// values added into it.
				225	void AddInlineAsmOperands(unsigned Code, SelectionDAG &DAG,
				226	std::vector<SDValue> &Ops) const;
				227	};
				228	}
				229
				230	/// isUsedOutsideOfDefiningBlock - Return true if this instruction is used by
				231	/// PHI nodes or outside of the basic block that defines it, or used by a
				232	/// switch or atomic instruction, which may expand to multiple basic blocks.
				233	static bool isUsedOutsideOfDefiningBlock(Instruction *I) {
				234	if (isa<PHINode>(I)) return true;
				235	BasicBlock *BB = I->getParent();
				236	for (Value::use_iterator UI = I->use_begin(), E = I->use_end(); UI != E; ++UI)
				237	if (cast<Instruction>(UI)->getParent() != BB \|\| isa<PHINode>(UI) \|\|
				238	// FIXME: Remove switchinst special case.
				239	isa<SwitchInst>(*UI))
				240	return true;
				241	return false;
				242	}
				243
				244	/// isOnlyUsedInEntryBlock - If the specified argument is only used in the
				245	/// entry block, return true. This includes arguments used by switches, since
				246	/// the switch may expand into multiple basic blocks.
				247	static bool isOnlyUsedInEntryBlock(Argument *A, bool EnableFastISel) {
				248	// With FastISel active, we may be splitting blocks, so force creation
				249	// of virtual registers for all non-dead arguments.
				250	if (EnableFastISel)
				251	return A->use_empty();
				252
				253	BasicBlock *Entry = A->getParent()->begin();
				254	for (Value::use_iterator UI = A->use_begin(), E = A->use_end(); UI != E; ++UI)
				255	if (cast<Instruction>(UI)->getParent() != Entry \|\| isa<SwitchInst>(UI))
				256	return false; // Use not in entry block.
				257	return true;
				258	}
				259
				260	FunctionLoweringInfo::FunctionLoweringInfo(TargetLowering &tli)
				261	: TLI(tli) {
				262	}
				263
				264	void FunctionLoweringInfo::set(Function &fn, MachineFunction &mf,
				265	bool EnableFastISel) {
				266	Fn = &fn;
				267	MF = &mf;
				268	RegInfo = &MF->getRegInfo();
				269
				270	// Create a vreg for each argument register that is not dead and is used
				271	// outside of the entry block for the function.
				272	for (Function::arg_iterator AI = Fn->arg_begin(), E = Fn->arg_end();
				273	AI != E; ++AI)
				274	if (!isOnlyUsedInEntryBlock(AI, EnableFastISel))
				275	InitializeRegForValue(AI);
				276
				277	// Initialize the mapping of values to registers. This is only set up for
				278	// instruction values that are used outside of the block that defines
				279	// them.
				280	Function::iterator BB = Fn->begin(), EB = Fn->end();
				281	for (BasicBlock::iterator I = BB->begin(), E = BB->end(); I != E; ++I)
				282	if (AllocaInst *AI = dyn_cast<AllocaInst>(I))
				283	if (ConstantInt *CUI = dyn_cast<ConstantInt>(AI->getArraySize())) {
				284	const Type *Ty = AI->getAllocatedType();
				285	uint64_t TySize = TLI.getTargetData()->getABITypeSize(Ty);
				286	unsigned Align =
				287	std::max((unsigned)TLI.getTargetData()->getPrefTypeAlignment(Ty),
				288	AI->getAlignment());
				289
				290	TySize *= CUI->getZExtValue(); // Get total allocated size.
				291	if (TySize == 0) TySize = 1; // Don't create zero-sized stack objects.
				292	StaticAllocaMap[AI] =
				293	MF->getFrameInfo()->CreateStackObject(TySize, Align);
				294	}
				295
				296	for (; BB != EB; ++BB)
				297	for (BasicBlock::iterator I = BB->begin(), E = BB->end(); I != E; ++I)
				298	if (!I->use_empty() && isUsedOutsideOfDefiningBlock(I))
				299	if (!isa<AllocaInst>(I) \|\|
				300	!StaticAllocaMap.count(cast<AllocaInst>(I)))
				301	InitializeRegForValue(I);
				302
				303	// Create an initial MachineBasicBlock for each LLVM BasicBlock in F. This
				304	// also creates the initial PHI MachineInstrs, though none of the input
				305	// operands are populated.
				306	for (BB = Fn->begin(), EB = Fn->end(); BB != EB; ++BB) {
				307	MachineBasicBlock *MBB = mf.CreateMachineBasicBlock(BB);
				308	MBBMap[BB] = MBB;
				309	MF->push_back(MBB);
				310
				311	// Create Machine PHI nodes for LLVM PHI nodes, lowering them as
				312	// appropriate.
				313	PHINode *PN;
				314	for (BasicBlock::iterator I = BB->begin();(PN = dyn_cast<PHINode>(I)); ++I){
				315	if (PN->use_empty()) continue;
				316
				317	unsigned PHIReg = ValueMap[PN];
				318	assert(PHIReg && "PHI node does not have an assigned virtual register!");
				319
				320	SmallVector<MVT, 4> ValueVTs;
				321	ComputeValueVTs(TLI, PN->getType(), ValueVTs);
				322	for (unsigned vti = 0, vte = ValueVTs.size(); vti != vte; ++vti) {
				323	MVT VT = ValueVTs[vti];
				324	unsigned NumRegisters = TLI.getNumRegisters(VT);
Dan Gohman	6448d91	2008-09-04 15:39:15 +0000	[diff] [blame]	325	const TargetInstrInfo *TII = MF->getTarget().getInstrInfo();
Dan Gohman	f0cbcd4	2008-09-03 16:12:24 +0000	[diff] [blame]	326	for (unsigned i = 0; i != NumRegisters; ++i)
				327	BuildMI(MBB, TII->get(TargetInstrInfo::PHI), PHIReg+i);
				328	PHIReg += NumRegisters;
				329	}
				330	}
				331	}
				332	}
				333
				334	unsigned FunctionLoweringInfo::MakeReg(MVT VT) {
				335	return RegInfo->createVirtualRegister(TLI.getRegClassFor(VT));
				336	}
				337
				338	/// CreateRegForValue - Allocate the appropriate number of virtual registers of
				339	/// the correctly promoted or expanded types. Assign these registers
				340	/// consecutive vreg numbers and return the first assigned number.
				341	///
				342	/// In the case that the given value has struct or array type, this function
				343	/// will assign registers for each member or element.
				344	///
				345	unsigned FunctionLoweringInfo::CreateRegForValue(const Value *V) {
				346	SmallVector<MVT, 4> ValueVTs;
				347	ComputeValueVTs(TLI, V->getType(), ValueVTs);
				348
				349	unsigned FirstReg = 0;
				350	for (unsigned Value = 0, e = ValueVTs.size(); Value != e; ++Value) {
				351	MVT ValueVT = ValueVTs[Value];
				352	MVT RegisterVT = TLI.getRegisterType(ValueVT);
				353
				354	unsigned NumRegs = TLI.getNumRegisters(ValueVT);
				355	for (unsigned i = 0; i != NumRegs; ++i) {
				356	unsigned R = MakeReg(RegisterVT);
				357	if (!FirstReg) FirstReg = R;
				358	}
				359	}
				360	return FirstReg;
				361	}
				362
				363	/// getCopyFromParts - Create a value that contains the specified legal parts
				364	/// combined into the value they represent. If the parts combine to a type
				365	/// larger then ValueVT then AssertOp can be used to specify whether the extra
				366	/// bits are known to be zero (ISD::AssertZext) or sign extended from ValueVT
				367	/// (ISD::AssertSext).
				368	static SDValue getCopyFromParts(SelectionDAG &DAG,
				369	const SDValue *Parts,
				370	unsigned NumParts,
				371	MVT PartVT,
				372	MVT ValueVT,
				373	ISD::NodeType AssertOp = ISD::DELETED_NODE) {
				374	assert(NumParts > 0 && "No parts to assemble!");
				375	TargetLowering &TLI = DAG.getTargetLoweringInfo();
				376	SDValue Val = Parts[0];
				377
				378	if (NumParts > 1) {
				379	// Assemble the value from multiple parts.
				380	if (!ValueVT.isVector()) {
				381	unsigned PartBits = PartVT.getSizeInBits();
				382	unsigned ValueBits = ValueVT.getSizeInBits();
				383
				384	// Assemble the power of 2 part.
				385	unsigned RoundParts = NumParts & (NumParts - 1) ?
				386	1 << Log2_32(NumParts) : NumParts;
				387	unsigned RoundBits = PartBits * RoundParts;
				388	MVT RoundVT = RoundBits == ValueBits ?
				389	ValueVT : MVT::getIntegerVT(RoundBits);
				390	SDValue Lo, Hi;
				391
				392	if (RoundParts > 2) {
				393	MVT HalfVT = MVT::getIntegerVT(RoundBits/2);
				394	Lo = getCopyFromParts(DAG, Parts, RoundParts/2, PartVT, HalfVT);
				395	Hi = getCopyFromParts(DAG, Parts+RoundParts/2, RoundParts/2,
				396	PartVT, HalfVT);
				397	} else {
				398	Lo = Parts[0];
				399	Hi = Parts[1];
				400	}
				401	if (TLI.isBigEndian())
				402	std::swap(Lo, Hi);
				403	Val = DAG.getNode(ISD::BUILD_PAIR, RoundVT, Lo, Hi);
				404
				405	if (RoundParts < NumParts) {
				406	// Assemble the trailing non-power-of-2 part.
				407	unsigned OddParts = NumParts - RoundParts;
				408	MVT OddVT = MVT::getIntegerVT(OddParts * PartBits);
				409	Hi = getCopyFromParts(DAG, Parts+RoundParts, OddParts, PartVT, OddVT);
				410
				411	// Combine the round and odd parts.
				412	Lo = Val;
				413	if (TLI.isBigEndian())
				414	std::swap(Lo, Hi);
				415	MVT TotalVT = MVT::getIntegerVT(NumParts * PartBits);
				416	Hi = DAG.getNode(ISD::ANY_EXTEND, TotalVT, Hi);
				417	Hi = DAG.getNode(ISD::SHL, TotalVT, Hi,
				418	DAG.getConstant(Lo.getValueType().getSizeInBits(),
				419	TLI.getShiftAmountTy()));
				420	Lo = DAG.getNode(ISD::ZERO_EXTEND, TotalVT, Lo);
				421	Val = DAG.getNode(ISD::OR, TotalVT, Lo, Hi);
				422	}
				423	} else {
				424	// Handle a multi-element vector.
				425	MVT IntermediateVT, RegisterVT;
				426	unsigned NumIntermediates;
				427	unsigned NumRegs =
				428	TLI.getVectorTypeBreakdown(ValueVT, IntermediateVT, NumIntermediates,
				429	RegisterVT);
				430	assert(NumRegs == NumParts && "Part count doesn't match vector breakdown!");
				431	NumParts = NumRegs; // Silence a compiler warning.
				432	assert(RegisterVT == PartVT && "Part type doesn't match vector breakdown!");
				433	assert(RegisterVT == Parts[0].getValueType() &&
				434	"Part type doesn't match part!");
				435
				436	// Assemble the parts into intermediate operands.
				437	SmallVector<SDValue, 8> Ops(NumIntermediates);
				438	if (NumIntermediates == NumParts) {
				439	// If the register was not expanded, truncate or copy the value,
				440	// as appropriate.
				441	for (unsigned i = 0; i != NumParts; ++i)
				442	Ops[i] = getCopyFromParts(DAG, &Parts[i], 1,
				443	PartVT, IntermediateVT);
				444	} else if (NumParts > 0) {
				445	// If the intermediate type was expanded, build the intermediate operands
				446	// from the parts.
				447	assert(NumParts % NumIntermediates == 0 &&
				448	"Must expand into a divisible number of parts!");
				449	unsigned Factor = NumParts / NumIntermediates;
				450	for (unsigned i = 0; i != NumIntermediates; ++i)
				451	Ops[i] = getCopyFromParts(DAG, &Parts[i * Factor], Factor,
				452	PartVT, IntermediateVT);
				453	}
				454
				455	// Build a vector with BUILD_VECTOR or CONCAT_VECTORS from the intermediate
				456	// operands.
				457	Val = DAG.getNode(IntermediateVT.isVector() ?
				458	ISD::CONCAT_VECTORS : ISD::BUILD_VECTOR,
				459	ValueVT, &Ops[0], NumIntermediates);
				460	}
				461	}
				462
				463	// There is now one part, held in Val. Correct it to match ValueVT.
				464	PartVT = Val.getValueType();
				465
				466	if (PartVT == ValueVT)
				467	return Val;
				468
				469	if (PartVT.isVector()) {
				470	assert(ValueVT.isVector() && "Unknown vector conversion!");
				471	return DAG.getNode(ISD::BIT_CONVERT, ValueVT, Val);
				472	}
				473
				474	if (ValueVT.isVector()) {
				475	assert(ValueVT.getVectorElementType() == PartVT &&
				476	ValueVT.getVectorNumElements() == 1 &&
				477	"Only trivial scalar-to-vector conversions should get here!");
				478	return DAG.getNode(ISD::BUILD_VECTOR, ValueVT, Val);
				479	}
				480
				481	if (PartVT.isInteger() &&
				482	ValueVT.isInteger()) {
				483	if (ValueVT.bitsLT(PartVT)) {
				484	// For a truncate, see if we have any information to
				485	// indicate whether the truncated bits will always be
				486	// zero or sign-extension.
				487	if (AssertOp != ISD::DELETED_NODE)
				488	Val = DAG.getNode(AssertOp, PartVT, Val,
				489	DAG.getValueType(ValueVT));
				490	return DAG.getNode(ISD::TRUNCATE, ValueVT, Val);
				491	} else {
				492	return DAG.getNode(ISD::ANY_EXTEND, ValueVT, Val);
				493	}
				494	}
				495
				496	if (PartVT.isFloatingPoint() && ValueVT.isFloatingPoint()) {
				497	if (ValueVT.bitsLT(Val.getValueType()))
				498	// FP_ROUND's are always exact here.
				499	return DAG.getNode(ISD::FP_ROUND, ValueVT, Val,
				500	DAG.getIntPtrConstant(1));
				501	return DAG.getNode(ISD::FP_EXTEND, ValueVT, Val);
				502	}
				503
				504	if (PartVT.getSizeInBits() == ValueVT.getSizeInBits())
				505	return DAG.getNode(ISD::BIT_CONVERT, ValueVT, Val);
				506
				507	assert(0 && "Unknown mismatch!");
				508	return SDValue();
				509	}
				510
				511	/// getCopyToParts - Create a series of nodes that contain the specified value
				512	/// split into legal parts. If the parts contain more bits than Val, then, for
				513	/// integers, ExtendKind can be used to specify how to generate the extra bits.
				514	static void getCopyToParts(SelectionDAG &DAG,
				515	SDValue Val,
				516	SDValue *Parts,
				517	unsigned NumParts,
				518	MVT PartVT,
				519	ISD::NodeType ExtendKind = ISD::ANY_EXTEND) {
				520	TargetLowering &TLI = DAG.getTargetLoweringInfo();
				521	MVT PtrVT = TLI.getPointerTy();
				522	MVT ValueVT = Val.getValueType();
				523	unsigned PartBits = PartVT.getSizeInBits();
				524	assert(TLI.isTypeLegal(PartVT) && "Copying to an illegal type!");
				525
				526	if (!NumParts)
				527	return;
				528
				529	if (!ValueVT.isVector()) {
				530	if (PartVT == ValueVT) {
				531	assert(NumParts == 1 && "No-op copy with multiple parts!");
				532	Parts[0] = Val;
				533	return;
				534	}
				535
				536	if (NumParts * PartBits > ValueVT.getSizeInBits()) {
				537	// If the parts cover more bits than the value has, promote the value.
				538	if (PartVT.isFloatingPoint() && ValueVT.isFloatingPoint()) {
				539	assert(NumParts == 1 && "Do not know what to promote to!");
				540	Val = DAG.getNode(ISD::FP_EXTEND, PartVT, Val);
				541	} else if (PartVT.isInteger() && ValueVT.isInteger()) {
				542	ValueVT = MVT::getIntegerVT(NumParts * PartBits);
				543	Val = DAG.getNode(ExtendKind, ValueVT, Val);
				544	} else {
				545	assert(0 && "Unknown mismatch!");
				546	}
				547	} else if (PartBits == ValueVT.getSizeInBits()) {
				548	// Different types of the same size.
				549	assert(NumParts == 1 && PartVT != ValueVT);
				550	Val = DAG.getNode(ISD::BIT_CONVERT, PartVT, Val);
				551	} else if (NumParts * PartBits < ValueVT.getSizeInBits()) {
				552	// If the parts cover less bits than value has, truncate the value.
				553	if (PartVT.isInteger() && ValueVT.isInteger()) {
				554	ValueVT = MVT::getIntegerVT(NumParts * PartBits);
				555	Val = DAG.getNode(ISD::TRUNCATE, ValueVT, Val);
				556	} else {
				557	assert(0 && "Unknown mismatch!");
				558	}
				559	}
				560
				561	// The value may have changed - recompute ValueVT.
				562	ValueVT = Val.getValueType();
				563	assert(NumParts * PartBits == ValueVT.getSizeInBits() &&
				564	"Failed to tile the value with PartVT!");
				565
				566	if (NumParts == 1) {
				567	assert(PartVT == ValueVT && "Type conversion failed!");
				568	Parts[0] = Val;
				569	return;
				570	}
				571
				572	// Expand the value into multiple parts.
				573	if (NumParts & (NumParts - 1)) {
				574	// The number of parts is not a power of 2. Split off and copy the tail.
				575	assert(PartVT.isInteger() && ValueVT.isInteger() &&
				576	"Do not know what to expand to!");
				577	unsigned RoundParts = 1 << Log2_32(NumParts);
				578	unsigned RoundBits = RoundParts * PartBits;
				579	unsigned OddParts = NumParts - RoundParts;
				580	SDValue OddVal = DAG.getNode(ISD::SRL, ValueVT, Val,
				581	DAG.getConstant(RoundBits,
				582	TLI.getShiftAmountTy()));
				583	getCopyToParts(DAG, OddVal, Parts + RoundParts, OddParts, PartVT);
				584	if (TLI.isBigEndian())
				585	// The odd parts were reversed by getCopyToParts - unreverse them.
				586	std::reverse(Parts + RoundParts, Parts + NumParts);
				587	NumParts = RoundParts;
				588	ValueVT = MVT::getIntegerVT(NumParts * PartBits);
				589	Val = DAG.getNode(ISD::TRUNCATE, ValueVT, Val);
				590	}
				591
				592	// The number of parts is a power of 2. Repeatedly bisect the value using
				593	// EXTRACT_ELEMENT.
				594	Parts[0] = DAG.getNode(ISD::BIT_CONVERT,
				595	MVT::getIntegerVT(ValueVT.getSizeInBits()),
				596	Val);
				597	for (unsigned StepSize = NumParts; StepSize > 1; StepSize /= 2) {
				598	for (unsigned i = 0; i < NumParts; i += StepSize) {
				599	unsigned ThisBits = StepSize * PartBits / 2;
				600	MVT ThisVT = MVT::getIntegerVT (ThisBits);
				601	SDValue &Part0 = Parts[i];
				602	SDValue &Part1 = Parts[i+StepSize/2];
				603
				604	Part1 = DAG.getNode(ISD::EXTRACT_ELEMENT, ThisVT, Part0,
				605	DAG.getConstant(1, PtrVT));
				606	Part0 = DAG.getNode(ISD::EXTRACT_ELEMENT, ThisVT, Part0,
				607	DAG.getConstant(0, PtrVT));
				608
				609	if (ThisBits == PartBits && ThisVT != PartVT) {
				610	Part0 = DAG.getNode(ISD::BIT_CONVERT, PartVT, Part0);
				611	Part1 = DAG.getNode(ISD::BIT_CONVERT, PartVT, Part1);
				612	}
				613	}
				614	}
				615
				616	if (TLI.isBigEndian())
				617	std::reverse(Parts, Parts + NumParts);
				618
				619	return;
				620	}
				621
				622	// Vector ValueVT.
				623	if (NumParts == 1) {
				624	if (PartVT != ValueVT) {
				625	if (PartVT.isVector()) {
				626	Val = DAG.getNode(ISD::BIT_CONVERT, PartVT, Val);
				627	} else {
				628	assert(ValueVT.getVectorElementType() == PartVT &&
				629	ValueVT.getVectorNumElements() == 1 &&
				630	"Only trivial vector-to-scalar conversions should get here!");
				631	Val = DAG.getNode(ISD::EXTRACT_VECTOR_ELT, PartVT, Val,
				632	DAG.getConstant(0, PtrVT));
				633	}
				634	}
				635
				636	Parts[0] = Val;
				637	return;
				638	}
				639
				640	// Handle a multi-element vector.
				641	MVT IntermediateVT, RegisterVT;
				642	unsigned NumIntermediates;
				643	unsigned NumRegs =
				644	DAG.getTargetLoweringInfo()
				645	.getVectorTypeBreakdown(ValueVT, IntermediateVT, NumIntermediates,
				646	RegisterVT);
				647	unsigned NumElements = ValueVT.getVectorNumElements();
				648
				649	assert(NumRegs == NumParts && "Part count doesn't match vector breakdown!");
				650	NumParts = NumRegs; // Silence a compiler warning.
				651	assert(RegisterVT == PartVT && "Part type doesn't match vector breakdown!");
				652
				653	// Split the vector into intermediate operands.
				654	SmallVector<SDValue, 8> Ops(NumIntermediates);
				655	for (unsigned i = 0; i != NumIntermediates; ++i)
				656	if (IntermediateVT.isVector())
				657	Ops[i] = DAG.getNode(ISD::EXTRACT_SUBVECTOR,
				658	IntermediateVT, Val,
				659	DAG.getConstant(i * (NumElements / NumIntermediates),
				660	PtrVT));
				661	else
				662	Ops[i] = DAG.getNode(ISD::EXTRACT_VECTOR_ELT,
				663	IntermediateVT, Val,
				664	DAG.getConstant(i, PtrVT));
				665
				666	// Split the intermediate operands into legal parts.
				667	if (NumParts == NumIntermediates) {
				668	// If the register was not expanded, promote or copy the value,
				669	// as appropriate.
				670	for (unsigned i = 0; i != NumParts; ++i)
				671	getCopyToParts(DAG, Ops[i], &Parts[i], 1, PartVT);
				672	} else if (NumParts > 0) {
				673	// If the intermediate type was expanded, split each the value into
				674	// legal parts.
				675	assert(NumParts % NumIntermediates == 0 &&
				676	"Must expand into a divisible number of parts!");
				677	unsigned Factor = NumParts / NumIntermediates;
				678	for (unsigned i = 0; i != NumIntermediates; ++i)
				679	getCopyToParts(DAG, Ops[i], &Parts[i * Factor], Factor, PartVT);
				680	}
				681	}
				682
				683
				684	void SelectionDAGLowering::init(GCFunctionInfo *gfi, AliasAnalysis &aa) {
				685	AA = &aa;
				686	GFI = gfi;
				687	TD = DAG.getTarget().getTargetData();
				688	}
				689
				690	/// clear - Clear out the curret SelectionDAG and the associated
				691	/// state and prepare this SelectionDAGLowering object to be used
				692	/// for a new block. This doesn't clear out information about
				693	/// additional blocks that are needed to complete switch lowering
				694	/// or PHI node updating; that information is cleared out as it is
				695	/// consumed.
				696	void SelectionDAGLowering::clear() {
				697	NodeMap.clear();
				698	PendingLoads.clear();
				699	PendingExports.clear();
				700	DAG.clear();
				701	}
				702
				703	/// getRoot - Return the current virtual root of the Selection DAG,
				704	/// flushing any PendingLoad items. This must be done before emitting
				705	/// a store or any other node that may need to be ordered after any
				706	/// prior load instructions.
				707	///
				708	SDValue SelectionDAGLowering::getRoot() {
				709	if (PendingLoads.empty())
				710	return DAG.getRoot();
				711
				712	if (PendingLoads.size() == 1) {
				713	SDValue Root = PendingLoads[0];
				714	DAG.setRoot(Root);
				715	PendingLoads.clear();
				716	return Root;
				717	}
				718
				719	// Otherwise, we have to make a token factor node.
				720	SDValue Root = DAG.getNode(ISD::TokenFactor, MVT::Other,
				721	&PendingLoads[0], PendingLoads.size());
				722	PendingLoads.clear();
				723	DAG.setRoot(Root);
				724	return Root;
				725	}
				726
				727	/// getControlRoot - Similar to getRoot, but instead of flushing all the
				728	/// PendingLoad items, flush all the PendingExports items. It is necessary
				729	/// to do this before emitting a terminator instruction.
				730	///
				731	SDValue SelectionDAGLowering::getControlRoot() {
				732	SDValue Root = DAG.getRoot();
				733
				734	if (PendingExports.empty())
				735	return Root;
				736
				737	// Turn all of the CopyToReg chains into one factored node.
				738	if (Root.getOpcode() != ISD::EntryToken) {
				739	unsigned i = 0, e = PendingExports.size();
				740	for (; i != e; ++i) {
				741	assert(PendingExports[i].getNode()->getNumOperands() > 1);
				742	if (PendingExports[i].getNode()->getOperand(0) == Root)
				743	break; // Don't add the root if we already indirectly depend on it.
				744	}
				745
				746	if (i == e)
				747	PendingExports.push_back(Root);
				748	}
				749
				750	Root = DAG.getNode(ISD::TokenFactor, MVT::Other,
				751	&PendingExports[0],
				752	PendingExports.size());
				753	PendingExports.clear();
				754	DAG.setRoot(Root);
				755	return Root;
				756	}
				757
				758	void SelectionDAGLowering::visit(Instruction &I) {
				759	visit(I.getOpcode(), I);
				760	}
				761
				762	void SelectionDAGLowering::visit(unsigned Opcode, User &I) {
				763	// Note: this doesn't use InstVisitor, because it has to work with
				764	// ConstantExpr's in addition to instructions.
				765	switch (Opcode) {
				766	default: assert(0 && "Unknown instruction type encountered!");
				767	abort();
				768	// Build the switch statement using the Instruction.def file.
				769	#define HANDLE_INST(NUM, OPCODE, CLASS) \
				770	case Instruction::OPCODE:return visit##OPCODE((CLASS&)I);
				771	#include "llvm/Instruction.def"
				772	}
				773	}
				774
				775	void SelectionDAGLowering::visitAdd(User &I) {
				776	if (I.getType()->isFPOrFPVector())
				777	visitBinary(I, ISD::FADD);
				778	else
				779	visitBinary(I, ISD::ADD);
				780	}
				781
				782	void SelectionDAGLowering::visitMul(User &I) {
				783	if (I.getType()->isFPOrFPVector())
				784	visitBinary(I, ISD::FMUL);
				785	else
				786	visitBinary(I, ISD::MUL);
				787	}
				788
				789	SDValue SelectionDAGLowering::getValue(const Value *V) {
				790	SDValue &N = NodeMap[V];
				791	if (N.getNode()) return N;
				792
				793	if (Constant C = const_cast<Constant>(dyn_cast<Constant>(V))) {
				794	MVT VT = TLI.getValueType(V->getType(), true);
				795
				796	if (ConstantInt *CI = dyn_cast<ConstantInt>(C))
				797	return N = DAG.getConstant(CI->getValue(), VT);
				798
				799	if (GlobalValue *GV = dyn_cast<GlobalValue>(C))
				800	return N = DAG.getGlobalAddress(GV, VT);
				801
				802	if (isa<ConstantPointerNull>(C))
				803	return N = DAG.getConstant(0, TLI.getPointerTy());
				804
				805	if (ConstantFP *CFP = dyn_cast<ConstantFP>(C))
				806	return N = DAG.getConstantFP(CFP->getValueAPF(), VT);
				807
				808	if (isa<UndefValue>(C) && !isa<VectorType>(V->getType()) &&
				809	!V->getType()->isAggregateType())
				810	return N = DAG.getNode(ISD::UNDEF, VT);
				811
				812	if (ConstantExpr *CE = dyn_cast<ConstantExpr>(C)) {
				813	visit(CE->getOpcode(), *CE);
				814	SDValue N1 = NodeMap[V];
				815	assert(N1.getNode() && "visit didn't populate the ValueMap!");
				816	return N1;
				817	}
				818
				819	if (isa<ConstantStruct>(C) \|\| isa<ConstantArray>(C)) {
				820	SmallVector<SDValue, 4> Constants;
				821	for (User::const_op_iterator OI = C->op_begin(), OE = C->op_end();
				822	OI != OE; ++OI) {
				823	SDNode Val = getValue(OI).getNode();
				824	for (unsigned i = 0, e = Val->getNumValues(); i != e; ++i)
				825	Constants.push_back(SDValue(Val, i));
				826	}
				827	return DAG.getMergeValues(&Constants[0], Constants.size());
				828	}
				829
				830	if (isa<StructType>(C->getType()) \|\| isa<ArrayType>(C->getType())) {
				831	assert((isa<ConstantAggregateZero>(C) \|\| isa<UndefValue>(C)) &&
				832	"Unknown struct or array constant!");
				833
				834	SmallVector<MVT, 4> ValueVTs;
				835	ComputeValueVTs(TLI, C->getType(), ValueVTs);
				836	unsigned NumElts = ValueVTs.size();
				837	if (NumElts == 0)
				838	return SDValue(); // empty struct
				839	SmallVector<SDValue, 4> Constants(NumElts);
				840	for (unsigned i = 0; i != NumElts; ++i) {
				841	MVT EltVT = ValueVTs[i];
				842	if (isa<UndefValue>(C))
				843	Constants[i] = DAG.getNode(ISD::UNDEF, EltVT);
				844	else if (EltVT.isFloatingPoint())
				845	Constants[i] = DAG.getConstantFP(0, EltVT);
				846	else
				847	Constants[i] = DAG.getConstant(0, EltVT);
				848	}
				849	return DAG.getMergeValues(&Constants[0], NumElts);
				850	}
				851
				852	const VectorType *VecTy = cast<VectorType>(V->getType());
				853	unsigned NumElements = VecTy->getNumElements();
				854
				855	// Now that we know the number and type of the elements, get that number of
				856	// elements into the Ops array based on what kind of constant it is.
				857	SmallVector<SDValue, 16> Ops;
				858	if (ConstantVector *CP = dyn_cast<ConstantVector>(C)) {
				859	for (unsigned i = 0; i != NumElements; ++i)
				860	Ops.push_back(getValue(CP->getOperand(i)));
				861	} else {
				862	assert((isa<ConstantAggregateZero>(C) \|\| isa<UndefValue>(C)) &&
				863	"Unknown vector constant!");
				864	MVT EltVT = TLI.getValueType(VecTy->getElementType());
				865
				866	SDValue Op;
				867	if (isa<UndefValue>(C))
				868	Op = DAG.getNode(ISD::UNDEF, EltVT);
				869	else if (EltVT.isFloatingPoint())
				870	Op = DAG.getConstantFP(0, EltVT);
				871	else
				872	Op = DAG.getConstant(0, EltVT);
				873	Ops.assign(NumElements, Op);
				874	}
				875
				876	// Create a BUILD_VECTOR node.
				877	return NodeMap[V] = DAG.getNode(ISD::BUILD_VECTOR, VT, &Ops[0], Ops.size());
				878	}
				879
				880	// If this is a static alloca, generate it as the frameindex instead of
				881	// computation.
				882	if (const AllocaInst *AI = dyn_cast<AllocaInst>(V)) {
				883	DenseMap<const AllocaInst*, int>::iterator SI =
				884	FuncInfo.StaticAllocaMap.find(AI);
				885	if (SI != FuncInfo.StaticAllocaMap.end())
				886	return DAG.getFrameIndex(SI->second, TLI.getPointerTy());
				887	}
				888
				889	unsigned InReg = FuncInfo.ValueMap[V];
				890	assert(InReg && "Value not in map!");
				891
				892	RegsForValue RFV(TLI, InReg, V->getType());
				893	SDValue Chain = DAG.getEntryNode();
				894	return RFV.getCopyFromRegs(DAG, Chain, NULL);
				895	}
				896
				897
				898	void SelectionDAGLowering::visitRet(ReturnInst &I) {
				899	if (I.getNumOperands() == 0) {
				900	DAG.setRoot(DAG.getNode(ISD::RET, MVT::Other, getControlRoot()));
				901	return;
				902	}
				903
				904	SmallVector<SDValue, 8> NewValues;
				905	NewValues.push_back(getControlRoot());
				906	for (unsigned i = 0, e = I.getNumOperands(); i != e; ++i) {
				907	SDValue RetOp = getValue(I.getOperand(i));
				908
				909	SmallVector<MVT, 4> ValueVTs;
				910	ComputeValueVTs(TLI, I.getOperand(i)->getType(), ValueVTs);
				911	for (unsigned j = 0, f = ValueVTs.size(); j != f; ++j) {
				912	MVT VT = ValueVTs[j];
				913
				914	// FIXME: C calling convention requires the return type to be promoted to
				915	// at least 32-bit. But this is not necessary for non-C calling conventions.
				916	if (VT.isInteger()) {
				917	MVT MinVT = TLI.getRegisterType(MVT::i32);
				918	if (VT.bitsLT(MinVT))
				919	VT = MinVT;
				920	}
				921
				922	unsigned NumParts = TLI.getNumRegisters(VT);
				923	MVT PartVT = TLI.getRegisterType(VT);
				924	SmallVector<SDValue, 4> Parts(NumParts);
				925	ISD::NodeType ExtendKind = ISD::ANY_EXTEND;
				926
				927	const Function *F = I.getParent()->getParent();
				928	if (F->paramHasAttr(0, ParamAttr::SExt))
				929	ExtendKind = ISD::SIGN_EXTEND;
				930	else if (F->paramHasAttr(0, ParamAttr::ZExt))
				931	ExtendKind = ISD::ZERO_EXTEND;
				932
				933	getCopyToParts(DAG, SDValue(RetOp.getNode(), RetOp.getResNo() + j),
				934	&Parts[0], NumParts, PartVT, ExtendKind);
				935
				936	for (unsigned i = 0; i < NumParts; ++i) {
				937	NewValues.push_back(Parts[i]);
				938	NewValues.push_back(DAG.getArgFlags(ISD::ArgFlagsTy()));
				939	}
				940	}
				941	}
				942	DAG.setRoot(DAG.getNode(ISD::RET, MVT::Other,
				943	&NewValues[0], NewValues.size()));
				944	}
				945
				946	/// ExportFromCurrentBlock - If this condition isn't known to be exported from
				947	/// the current basic block, add it to ValueMap now so that we'll get a
				948	/// CopyTo/FromReg.
				949	void SelectionDAGLowering::ExportFromCurrentBlock(Value *V) {
				950	// No need to export constants.
				951	if (!isa<Instruction>(V) && !isa<Argument>(V)) return;
				952
				953	// Already exported?
				954	if (FuncInfo.isExportedInst(V)) return;
				955
				956	unsigned Reg = FuncInfo.InitializeRegForValue(V);
				957	CopyValueToVirtualRegister(V, Reg);
				958	}
				959
				960	bool SelectionDAGLowering::isExportableFromCurrentBlock(Value *V,
				961	const BasicBlock *FromBB) {
				962	// The operands of the setcc have to be in this block. We don't know
				963	// how to export them from some other block.
				964	if (Instruction *VI = dyn_cast<Instruction>(V)) {
				965	// Can export from current BB.
				966	if (VI->getParent() == FromBB)
				967	return true;
				968
				969	// Is already exported, noop.
				970	return FuncInfo.isExportedInst(V);
				971	}
				972
				973	// If this is an argument, we can export it if the BB is the entry block or
				974	// if it is already exported.
				975	if (isa<Argument>(V)) {
				976	if (FromBB == &FromBB->getParent()->getEntryBlock())
				977	return true;
				978
				979	// Otherwise, can only export this if it is already exported.
				980	return FuncInfo.isExportedInst(V);
				981	}
				982
				983	// Otherwise, constants can always be exported.
				984	return true;
				985	}
				986
				987	static bool InBlock(const Value V, const BasicBlock BB) {
				988	if (const Instruction *I = dyn_cast<Instruction>(V))
				989	return I->getParent() == BB;
				990	return true;
				991	}
				992
				993	/// FindMergedConditions - If Cond is an expression like
				994	void SelectionDAGLowering::FindMergedConditions(Value *Cond,
				995	MachineBasicBlock *TBB,
				996	MachineBasicBlock *FBB,
				997	MachineBasicBlock *CurBB,
				998	unsigned Opc) {
				999	// If this node is not part of the or/and tree, emit it as a branch.
				1000	Instruction *BOp = dyn_cast<Instruction>(Cond);
				1001
				1002	if (!BOp \|\| !(isa<BinaryOperator>(BOp) \|\| isa<CmpInst>(BOp)) \|\|
				1003	(unsigned)BOp->getOpcode() != Opc \|\| !BOp->hasOneUse() \|\|
				1004	BOp->getParent() != CurBB->getBasicBlock() \|\|
				1005	!InBlock(BOp->getOperand(0), CurBB->getBasicBlock()) \|\|
				1006	!InBlock(BOp->getOperand(1), CurBB->getBasicBlock())) {
				1007	const BasicBlock *BB = CurBB->getBasicBlock();
				1008
				1009	// If the leaf of the tree is a comparison, merge the condition into
				1010	// the caseblock.
				1011	if ((isa<ICmpInst>(Cond) \|\| isa<FCmpInst>(Cond)) &&
				1012	// The operands of the cmp have to be in this block. We don't know
				1013	// how to export them from some other block. If this is the first block
				1014	// of the sequence, no exporting is needed.
				1015	(CurBB == CurMBB \|\|
				1016	(isExportableFromCurrentBlock(BOp->getOperand(0), BB) &&
				1017	isExportableFromCurrentBlock(BOp->getOperand(1), BB)))) {
				1018	BOp = cast<Instruction>(Cond);
				1019	ISD::CondCode Condition;
				1020	if (ICmpInst *IC = dyn_cast<ICmpInst>(Cond)) {
				1021	switch (IC->getPredicate()) {
				1022	default: assert(0 && "Unknown icmp predicate opcode!");
				1023	case ICmpInst::ICMP_EQ: Condition = ISD::SETEQ; break;
				1024	case ICmpInst::ICMP_NE: Condition = ISD::SETNE; break;
				1025	case ICmpInst::ICMP_SLE: Condition = ISD::SETLE; break;
				1026	case ICmpInst::ICMP_ULE: Condition = ISD::SETULE; break;
				1027	case ICmpInst::ICMP_SGE: Condition = ISD::SETGE; break;
				1028	case ICmpInst::ICMP_UGE: Condition = ISD::SETUGE; break;
				1029	case ICmpInst::ICMP_SLT: Condition = ISD::SETLT; break;
				1030	case ICmpInst::ICMP_ULT: Condition = ISD::SETULT; break;
				1031	case ICmpInst::ICMP_SGT: Condition = ISD::SETGT; break;
				1032	case ICmpInst::ICMP_UGT: Condition = ISD::SETUGT; break;
				1033	}
				1034	} else if (FCmpInst *FC = dyn_cast<FCmpInst>(Cond)) {
				1035	ISD::CondCode FPC, FOC;
				1036	switch (FC->getPredicate()) {
				1037	default: assert(0 && "Unknown fcmp predicate opcode!");
				1038	case FCmpInst::FCMP_FALSE: FOC = FPC = ISD::SETFALSE; break;
				1039	case FCmpInst::FCMP_OEQ: FOC = ISD::SETEQ; FPC = ISD::SETOEQ; break;
				1040	case FCmpInst::FCMP_OGT: FOC = ISD::SETGT; FPC = ISD::SETOGT; break;
				1041	case FCmpInst::FCMP_OGE: FOC = ISD::SETGE; FPC = ISD::SETOGE; break;
				1042	case FCmpInst::FCMP_OLT: FOC = ISD::SETLT; FPC = ISD::SETOLT; break;
				1043	case FCmpInst::FCMP_OLE: FOC = ISD::SETLE; FPC = ISD::SETOLE; break;
				1044	case FCmpInst::FCMP_ONE: FOC = ISD::SETNE; FPC = ISD::SETONE; break;
				1045	case FCmpInst::FCMP_ORD: FOC = FPC = ISD::SETO; break;
				1046	case FCmpInst::FCMP_UNO: FOC = FPC = ISD::SETUO; break;
				1047	case FCmpInst::FCMP_UEQ: FOC = ISD::SETEQ; FPC = ISD::SETUEQ; break;
				1048	case FCmpInst::FCMP_UGT: FOC = ISD::SETGT; FPC = ISD::SETUGT; break;
				1049	case FCmpInst::FCMP_UGE: FOC = ISD::SETGE; FPC = ISD::SETUGE; break;
				1050	case FCmpInst::FCMP_ULT: FOC = ISD::SETLT; FPC = ISD::SETULT; break;
				1051	case FCmpInst::FCMP_ULE: FOC = ISD::SETLE; FPC = ISD::SETULE; break;
				1052	case FCmpInst::FCMP_UNE: FOC = ISD::SETNE; FPC = ISD::SETUNE; break;
				1053	case FCmpInst::FCMP_TRUE: FOC = FPC = ISD::SETTRUE; break;
				1054	}
				1055	if (FiniteOnlyFPMath())
				1056	Condition = FOC;
				1057	else
				1058	Condition = FPC;
				1059	} else {
				1060	Condition = ISD::SETEQ; // silence warning.
				1061	assert(0 && "Unknown compare instruction");
				1062	}
				1063
				1064	CaseBlock CB(Condition, BOp->getOperand(0),
				1065	BOp->getOperand(1), NULL, TBB, FBB, CurBB);
				1066	SwitchCases.push_back(CB);
				1067	return;
				1068	}
				1069
				1070	// Create a CaseBlock record representing this branch.
				1071	CaseBlock CB(ISD::SETEQ, Cond, ConstantInt::getTrue(),
				1072	NULL, TBB, FBB, CurBB);
				1073	SwitchCases.push_back(CB);
				1074	return;
				1075	}
				1076
				1077
				1078	// Create TmpBB after CurBB.
				1079	MachineFunction::iterator BBI = CurBB;
				1080	MachineFunction &MF = DAG.getMachineFunction();
				1081	MachineBasicBlock *TmpBB = MF.CreateMachineBasicBlock(CurBB->getBasicBlock());
				1082	CurBB->getParent()->insert(++BBI, TmpBB);
				1083
				1084	if (Opc == Instruction::Or) {
				1085	// Codegen X \| Y as:
				1086	// jmp_if_X TBB
				1087	// jmp TmpBB
				1088	// TmpBB:
				1089	// jmp_if_Y TBB
				1090	// jmp FBB
				1091	//
				1092
				1093	// Emit the LHS condition.
				1094	FindMergedConditions(BOp->getOperand(0), TBB, TmpBB, CurBB, Opc);
				1095
				1096	// Emit the RHS condition into TmpBB.
				1097	FindMergedConditions(BOp->getOperand(1), TBB, FBB, TmpBB, Opc);
				1098	} else {
				1099	assert(Opc == Instruction::And && "Unknown merge op!");
				1100	// Codegen X & Y as:
				1101	// jmp_if_X TmpBB
				1102	// jmp FBB
				1103	// TmpBB:
				1104	// jmp_if_Y TBB
				1105	// jmp FBB
				1106	//
				1107	// This requires creation of TmpBB after CurBB.
				1108
				1109	// Emit the LHS condition.
				1110	FindMergedConditions(BOp->getOperand(0), TmpBB, FBB, CurBB, Opc);
				1111
				1112	// Emit the RHS condition into TmpBB.
				1113	FindMergedConditions(BOp->getOperand(1), TBB, FBB, TmpBB, Opc);
				1114	}
				1115	}
				1116
				1117	/// If the set of cases should be emitted as a series of branches, return true.
				1118	/// If we should emit this as a bunch of and/or'd together conditions, return
				1119	/// false.
				1120	bool
				1121	SelectionDAGLowering::ShouldEmitAsBranches(const std::vector<CaseBlock> &Cases){
				1122	if (Cases.size() != 2) return true;
				1123
				1124	// If this is two comparisons of the same values or'd or and'd together, they
				1125	// will get folded into a single comparison, so don't emit two blocks.
				1126	if ((Cases[0].CmpLHS == Cases[1].CmpLHS &&
				1127	Cases[0].CmpRHS == Cases[1].CmpRHS) \|\|
				1128	(Cases[0].CmpRHS == Cases[1].CmpLHS &&
				1129	Cases[0].CmpLHS == Cases[1].CmpRHS)) {
				1130	return false;
				1131	}
				1132
				1133	return true;
				1134	}
				1135
				1136	void SelectionDAGLowering::visitBr(BranchInst &I) {
				1137	// Update machine-CFG edges.
				1138	MachineBasicBlock *Succ0MBB = FuncInfo.MBBMap[I.getSuccessor(0)];
				1139
				1140	// Figure out which block is immediately after the current one.
				1141	MachineBasicBlock *NextBlock = 0;
				1142	MachineFunction::iterator BBI = CurMBB;
				1143	if (++BBI != CurMBB->getParent()->end())
				1144	NextBlock = BBI;
				1145
				1146	if (I.isUnconditional()) {
				1147	// Update machine-CFG edges.
				1148	CurMBB->addSuccessor(Succ0MBB);
				1149
				1150	// If this is not a fall-through branch, emit the branch.
				1151	if (Succ0MBB != NextBlock)
				1152	DAG.setRoot(DAG.getNode(ISD::BR, MVT::Other, getControlRoot(),
				1153	DAG.getBasicBlock(Succ0MBB)));
				1154	return;
				1155	}
				1156
				1157	// If this condition is one of the special cases we handle, do special stuff
				1158	// now.
				1159	Value *CondVal = I.getCondition();
				1160	MachineBasicBlock *Succ1MBB = FuncInfo.MBBMap[I.getSuccessor(1)];
				1161
				1162	// If this is a series of conditions that are or'd or and'd together, emit
				1163	// this as a sequence of branches instead of setcc's with and/or operations.
				1164	// For example, instead of something like:
				1165	// cmp A, B
				1166	// C = seteq
				1167	// cmp D, E
				1168	// F = setle
				1169	// or C, F
				1170	// jnz foo
				1171	// Emit:
				1172	// cmp A, B
				1173	// je foo
				1174	// cmp D, E
				1175	// jle foo
				1176	//
				1177	if (BinaryOperator *BOp = dyn_cast<BinaryOperator>(CondVal)) {
				1178	if (BOp->hasOneUse() &&
				1179	(BOp->getOpcode() == Instruction::And \|\|
				1180	BOp->getOpcode() == Instruction::Or)) {
				1181	FindMergedConditions(BOp, Succ0MBB, Succ1MBB, CurMBB, BOp->getOpcode());
				1182	// If the compares in later blocks need to use values not currently
				1183	// exported from this block, export them now. This block should always
				1184	// be the first entry.
				1185	assert(SwitchCases[0].ThisBB == CurMBB && "Unexpected lowering!");
				1186
				1187	// Allow some cases to be rejected.
				1188	if (ShouldEmitAsBranches(SwitchCases)) {
				1189	for (unsigned i = 1, e = SwitchCases.size(); i != e; ++i) {
				1190	ExportFromCurrentBlock(SwitchCases[i].CmpLHS);
				1191	ExportFromCurrentBlock(SwitchCases[i].CmpRHS);
				1192	}
				1193
				1194	// Emit the branch for this block.
				1195	visitSwitchCase(SwitchCases[0]);
				1196	SwitchCases.erase(SwitchCases.begin());
				1197	return;
				1198	}
				1199
				1200	// Okay, we decided not to do this, remove any inserted MBB's and clear
				1201	// SwitchCases.
				1202	for (unsigned i = 1, e = SwitchCases.size(); i != e; ++i)
				1203	CurMBB->getParent()->erase(SwitchCases[i].ThisBB);
				1204
				1205	SwitchCases.clear();
				1206	}
				1207	}
				1208
				1209	// Create a CaseBlock record representing this branch.
				1210	CaseBlock CB(ISD::SETEQ, CondVal, ConstantInt::getTrue(),
				1211	NULL, Succ0MBB, Succ1MBB, CurMBB);
				1212	// Use visitSwitchCase to actually insert the fast branch sequence for this
				1213	// cond branch.
				1214	visitSwitchCase(CB);
				1215	}
				1216
				1217	/// visitSwitchCase - Emits the necessary code to represent a single node in
				1218	/// the binary search tree resulting from lowering a switch instruction.
				1219	void SelectionDAGLowering::visitSwitchCase(CaseBlock &CB) {
				1220	SDValue Cond;
				1221	SDValue CondLHS = getValue(CB.CmpLHS);
				1222
				1223	// Build the setcc now.
				1224	if (CB.CmpMHS == NULL) {
				1225	// Fold "(X == true)" to X and "(X == false)" to !X to
				1226	// handle common cases produced by branch lowering.
				1227	if (CB.CmpRHS == ConstantInt::getTrue() && CB.CC == ISD::SETEQ)
				1228	Cond = CondLHS;
				1229	else if (CB.CmpRHS == ConstantInt::getFalse() && CB.CC == ISD::SETEQ) {
				1230	SDValue True = DAG.getConstant(1, CondLHS.getValueType());
				1231	Cond = DAG.getNode(ISD::XOR, CondLHS.getValueType(), CondLHS, True);
				1232	} else
				1233	Cond = DAG.getSetCC(MVT::i1, CondLHS, getValue(CB.CmpRHS), CB.CC);
				1234	} else {
				1235	assert(CB.CC == ISD::SETLE && "Can handle only LE ranges now");
				1236
				1237	uint64_t Low = cast<ConstantInt>(CB.CmpLHS)->getSExtValue();
				1238	uint64_t High = cast<ConstantInt>(CB.CmpRHS)->getSExtValue();
				1239
				1240	SDValue CmpOp = getValue(CB.CmpMHS);
				1241	MVT VT = CmpOp.getValueType();
				1242
				1243	if (cast<ConstantInt>(CB.CmpLHS)->isMinValue(true)) {
				1244	Cond = DAG.getSetCC(MVT::i1, CmpOp, DAG.getConstant(High, VT), ISD::SETLE);
				1245	} else {
				1246	SDValue SUB = DAG.getNode(ISD::SUB, VT, CmpOp, DAG.getConstant(Low, VT));
				1247	Cond = DAG.getSetCC(MVT::i1, SUB,
				1248	DAG.getConstant(High-Low, VT), ISD::SETULE);
				1249	}
				1250	}
				1251
				1252	// Update successor info
				1253	CurMBB->addSuccessor(CB.TrueBB);
				1254	CurMBB->addSuccessor(CB.FalseBB);
				1255
				1256	// Set NextBlock to be the MBB immediately after the current one, if any.
				1257	// This is used to avoid emitting unnecessary branches to the next block.
				1258	MachineBasicBlock *NextBlock = 0;
				1259	MachineFunction::iterator BBI = CurMBB;
				1260	if (++BBI != CurMBB->getParent()->end())
				1261	NextBlock = BBI;
				1262
				1263	// If the lhs block is the next block, invert the condition so that we can
				1264	// fall through to the lhs instead of the rhs block.
				1265	if (CB.TrueBB == NextBlock) {
				1266	std::swap(CB.TrueBB, CB.FalseBB);
				1267	SDValue True = DAG.getConstant(1, Cond.getValueType());
				1268	Cond = DAG.getNode(ISD::XOR, Cond.getValueType(), Cond, True);
				1269	}
				1270	SDValue BrCond = DAG.getNode(ISD::BRCOND, MVT::Other, getControlRoot(), Cond,
				1271	DAG.getBasicBlock(CB.TrueBB));
				1272
				1273	// If the branch was constant folded, fix up the CFG.
				1274	if (BrCond.getOpcode() == ISD::BR) {
				1275	CurMBB->removeSuccessor(CB.FalseBB);
				1276	DAG.setRoot(BrCond);
				1277	} else {
				1278	// Otherwise, go ahead and insert the false branch.
				1279	if (BrCond == getControlRoot())
				1280	CurMBB->removeSuccessor(CB.TrueBB);
				1281
				1282	if (CB.FalseBB == NextBlock)
				1283	DAG.setRoot(BrCond);
				1284	else
				1285	DAG.setRoot(DAG.getNode(ISD::BR, MVT::Other, BrCond,
				1286	DAG.getBasicBlock(CB.FalseBB)));
				1287	}
				1288	}
				1289
				1290	/// visitJumpTable - Emit JumpTable node in the current MBB
				1291	void SelectionDAGLowering::visitJumpTable(JumpTable &JT) {
				1292	// Emit the code for the jump table
				1293	assert(JT.Reg != -1U && "Should lower JT Header first!");
				1294	MVT PTy = TLI.getPointerTy();
				1295	SDValue Index = DAG.getCopyFromReg(getControlRoot(), JT.Reg, PTy);
				1296	SDValue Table = DAG.getJumpTable(JT.JTI, PTy);
				1297	DAG.setRoot(DAG.getNode(ISD::BR_JT, MVT::Other, Index.getValue(1),
				1298	Table, Index));
				1299	return;
				1300	}
				1301
				1302	/// visitJumpTableHeader - This function emits necessary code to produce index
				1303	/// in the JumpTable from switch case.
				1304	void SelectionDAGLowering::visitJumpTableHeader(JumpTable &JT,
				1305	JumpTableHeader &JTH) {
				1306	// Subtract the lowest switch case value from the value being switched on
				1307	// and conditional branch to default mbb if the result is greater than the
				1308	// difference between smallest and largest cases.
				1309	SDValue SwitchOp = getValue(JTH.SValue);
				1310	MVT VT = SwitchOp.getValueType();
				1311	SDValue SUB = DAG.getNode(ISD::SUB, VT, SwitchOp,
				1312	DAG.getConstant(JTH.First, VT));
				1313
				1314	// The SDNode we just created, which holds the value being switched on
				1315	// minus the the smallest case value, needs to be copied to a virtual
				1316	// register so it can be used as an index into the jump table in a
				1317	// subsequent basic block. This value may be smaller or larger than the
				1318	// target's pointer type, and therefore require extension or truncating.
				1319	if (VT.bitsGT(TLI.getPointerTy()))
				1320	SwitchOp = DAG.getNode(ISD::TRUNCATE, TLI.getPointerTy(), SUB);
				1321	else
				1322	SwitchOp = DAG.getNode(ISD::ZERO_EXTEND, TLI.getPointerTy(), SUB);
				1323
				1324	unsigned JumpTableReg = FuncInfo.MakeReg(TLI.getPointerTy());
				1325	SDValue CopyTo = DAG.getCopyToReg(getControlRoot(), JumpTableReg, SwitchOp);
				1326	JT.Reg = JumpTableReg;
				1327
				1328	// Emit the range check for the jump table, and branch to the default
				1329	// block for the switch statement if the value being switched on exceeds
				1330	// the largest case in the switch.
				1331	SDValue CMP = DAG.getSetCC(TLI.getSetCCResultType(SUB), SUB,
				1332	DAG.getConstant(JTH.Last-JTH.First,VT),
				1333	ISD::SETUGT);
				1334
				1335	// Set NextBlock to be the MBB immediately after the current one, if any.
				1336	// This is used to avoid emitting unnecessary branches to the next block.
				1337	MachineBasicBlock *NextBlock = 0;
				1338	MachineFunction::iterator BBI = CurMBB;
				1339	if (++BBI != CurMBB->getParent()->end())
				1340	NextBlock = BBI;
				1341
				1342	SDValue BrCond = DAG.getNode(ISD::BRCOND, MVT::Other, CopyTo, CMP,
				1343	DAG.getBasicBlock(JT.Default));
				1344
				1345	if (JT.MBB == NextBlock)
				1346	DAG.setRoot(BrCond);
				1347	else
				1348	DAG.setRoot(DAG.getNode(ISD::BR, MVT::Other, BrCond,
				1349	DAG.getBasicBlock(JT.MBB)));
				1350
				1351	return;
				1352	}
				1353
				1354	/// visitBitTestHeader - This function emits necessary code to produce value
				1355	/// suitable for "bit tests"
				1356	void SelectionDAGLowering::visitBitTestHeader(BitTestBlock &B) {
				1357	// Subtract the minimum value
				1358	SDValue SwitchOp = getValue(B.SValue);
				1359	MVT VT = SwitchOp.getValueType();
				1360	SDValue SUB = DAG.getNode(ISD::SUB, VT, SwitchOp,
				1361	DAG.getConstant(B.First, VT));
				1362
				1363	// Check range
				1364	SDValue RangeCmp = DAG.getSetCC(TLI.getSetCCResultType(SUB), SUB,
				1365	DAG.getConstant(B.Range, VT),
				1366	ISD::SETUGT);
				1367
				1368	SDValue ShiftOp;
				1369	if (VT.bitsGT(TLI.getShiftAmountTy()))
				1370	ShiftOp = DAG.getNode(ISD::TRUNCATE, TLI.getShiftAmountTy(), SUB);
				1371	else
				1372	ShiftOp = DAG.getNode(ISD::ZERO_EXTEND, TLI.getShiftAmountTy(), SUB);
				1373
				1374	// Make desired shift
				1375	SDValue SwitchVal = DAG.getNode(ISD::SHL, TLI.getPointerTy(),
				1376	DAG.getConstant(1, TLI.getPointerTy()),
				1377	ShiftOp);
				1378
				1379	unsigned SwitchReg = FuncInfo.MakeReg(TLI.getPointerTy());
				1380	SDValue CopyTo = DAG.getCopyToReg(getControlRoot(), SwitchReg, SwitchVal);
				1381	B.Reg = SwitchReg;
				1382
				1383	// Set NextBlock to be the MBB immediately after the current one, if any.
				1384	// This is used to avoid emitting unnecessary branches to the next block.
				1385	MachineBasicBlock *NextBlock = 0;
				1386	MachineFunction::iterator BBI = CurMBB;
				1387	if (++BBI != CurMBB->getParent()->end())
				1388	NextBlock = BBI;
				1389
				1390	MachineBasicBlock* MBB = B.Cases[0].ThisBB;
				1391
				1392	CurMBB->addSuccessor(B.Default);
				1393	CurMBB->addSuccessor(MBB);
				1394
				1395	SDValue BrRange = DAG.getNode(ISD::BRCOND, MVT::Other, CopyTo, RangeCmp,
				1396	DAG.getBasicBlock(B.Default));
				1397
				1398	if (MBB == NextBlock)
				1399	DAG.setRoot(BrRange);
				1400	else
				1401	DAG.setRoot(DAG.getNode(ISD::BR, MVT::Other, CopyTo,
				1402	DAG.getBasicBlock(MBB)));
				1403
				1404	return;
				1405	}
				1406
				1407	/// visitBitTestCase - this function produces one "bit test"
				1408	void SelectionDAGLowering::visitBitTestCase(MachineBasicBlock* NextMBB,
				1409	unsigned Reg,
				1410	BitTestCase &B) {
				1411	// Emit bit tests and jumps
				1412	SDValue SwitchVal = DAG.getCopyFromReg(getControlRoot(), Reg,
				1413	TLI.getPointerTy());
				1414
				1415	SDValue AndOp = DAG.getNode(ISD::AND, TLI.getPointerTy(), SwitchVal,
				1416	DAG.getConstant(B.Mask, TLI.getPointerTy()));
				1417	SDValue AndCmp = DAG.getSetCC(TLI.getSetCCResultType(AndOp), AndOp,
				1418	DAG.getConstant(0, TLI.getPointerTy()),
				1419	ISD::SETNE);
				1420
				1421	CurMBB->addSuccessor(B.TargetBB);
				1422	CurMBB->addSuccessor(NextMBB);
				1423
				1424	SDValue BrAnd = DAG.getNode(ISD::BRCOND, MVT::Other, getControlRoot(),
				1425	AndCmp, DAG.getBasicBlock(B.TargetBB));
				1426
				1427	// Set NextBlock to be the MBB immediately after the current one, if any.
				1428	// This is used to avoid emitting unnecessary branches to the next block.
				1429	MachineBasicBlock *NextBlock = 0;
				1430	MachineFunction::iterator BBI = CurMBB;
				1431	if (++BBI != CurMBB->getParent()->end())
				1432	NextBlock = BBI;
				1433
				1434	if (NextMBB == NextBlock)
				1435	DAG.setRoot(BrAnd);
				1436	else
				1437	DAG.setRoot(DAG.getNode(ISD::BR, MVT::Other, BrAnd,
				1438	DAG.getBasicBlock(NextMBB)));
				1439
				1440	return;
				1441	}
				1442
				1443	void SelectionDAGLowering::visitInvoke(InvokeInst &I) {
				1444	// Retrieve successors.
				1445	MachineBasicBlock *Return = FuncInfo.MBBMap[I.getSuccessor(0)];
				1446	MachineBasicBlock *LandingPad = FuncInfo.MBBMap[I.getSuccessor(1)];
				1447
				1448	if (isa<InlineAsm>(I.getCalledValue()))
				1449	visitInlineAsm(&I);
				1450	else
				1451	LowerCallTo(&I, getValue(I.getOperand(0)), false, LandingPad);
				1452
				1453	// If the value of the invoke is used outside of its defining block, make it
				1454	// available as a virtual register.
				1455	if (!I.use_empty()) {
				1456	DenseMap<const Value*, unsigned>::iterator VMI = FuncInfo.ValueMap.find(&I);
				1457	if (VMI != FuncInfo.ValueMap.end())
				1458	CopyValueToVirtualRegister(&I, VMI->second);
				1459	}
				1460
				1461	// Update successor info
				1462	CurMBB->addSuccessor(Return);
				1463	CurMBB->addSuccessor(LandingPad);
				1464
				1465	// Drop into normal successor.
				1466	DAG.setRoot(DAG.getNode(ISD::BR, MVT::Other, getControlRoot(),
				1467	DAG.getBasicBlock(Return)));
				1468	}
				1469
				1470	void SelectionDAGLowering::visitUnwind(UnwindInst &I) {
				1471	}
				1472
				1473	/// handleSmallSwitchCaseRange - Emit a series of specific tests (suitable for
				1474	/// small case ranges).
				1475	bool SelectionDAGLowering::handleSmallSwitchRange(CaseRec& CR,
				1476	CaseRecVector& WorkList,
				1477	Value* SV,
				1478	MachineBasicBlock* Default) {
				1479	Case& BackCase = *(CR.Range.second-1);
				1480
				1481	// Size is the number of Cases represented by this range.
				1482	unsigned Size = CR.Range.second - CR.Range.first;
				1483	if (Size > 3)
				1484	return false;
				1485
				1486	// Get the MachineFunction which holds the current MBB. This is used when
				1487	// inserting any additional MBBs necessary to represent the switch.
				1488	MachineFunction *CurMF = CurMBB->getParent();
				1489
				1490	// Figure out which block is immediately after the current one.
				1491	MachineBasicBlock *NextBlock = 0;
				1492	MachineFunction::iterator BBI = CR.CaseBB;
				1493
				1494	if (++BBI != CurMBB->getParent()->end())
				1495	NextBlock = BBI;
				1496
				1497	// TODO: If any two of the cases has the same destination, and if one value
				1498	// is the same as the other, but has one bit unset that the other has set,
				1499	// use bit manipulation to do two compares at once. For example:
				1500	// "if (X == 6 \|\| X == 4)" -> "if ((X\|2) == 6)"
				1501
				1502	// Rearrange the case blocks so that the last one falls through if possible.
				1503	if (NextBlock && Default != NextBlock && BackCase.BB != NextBlock) {
				1504	// The last case block won't fall through into 'NextBlock' if we emit the
				1505	// branches in this order. See if rearranging a case value would help.
				1506	for (CaseItr I = CR.Range.first, E = CR.Range.second-1; I != E; ++I) {
				1507	if (I->BB == NextBlock) {
				1508	std::swap(*I, BackCase);
				1509	break;
				1510	}
				1511	}
				1512	}
				1513
				1514	// Create a CaseBlock record representing a conditional branch to
				1515	// the Case's target mbb if the value being switched on SV is equal
				1516	// to C.
				1517	MachineBasicBlock *CurBlock = CR.CaseBB;
				1518	for (CaseItr I = CR.Range.first, E = CR.Range.second; I != E; ++I) {
				1519	MachineBasicBlock *FallThrough;
				1520	if (I != E-1) {
				1521	FallThrough = CurMF->CreateMachineBasicBlock(CurBlock->getBasicBlock());
				1522	CurMF->insert(BBI, FallThrough);
				1523	} else {
				1524	// If the last case doesn't match, go to the default block.
				1525	FallThrough = Default;
				1526	}
				1527
				1528	Value RHS, LHS, *MHS;
				1529	ISD::CondCode CC;
				1530	if (I->High == I->Low) {
				1531	// This is just small small case range :) containing exactly 1 case
				1532	CC = ISD::SETEQ;
				1533	LHS = SV; RHS = I->High; MHS = NULL;
				1534	} else {
				1535	CC = ISD::SETLE;
				1536	LHS = I->Low; MHS = SV; RHS = I->High;
				1537	}
				1538	CaseBlock CB(CC, LHS, RHS, MHS, I->BB, FallThrough, CurBlock);
				1539
				1540	// If emitting the first comparison, just call visitSwitchCase to emit the
				1541	// code into the current block. Otherwise, push the CaseBlock onto the
				1542	// vector to be later processed by SDISel, and insert the node's MBB
				1543	// before the next MBB.
				1544	if (CurBlock == CurMBB)
				1545	visitSwitchCase(CB);
				1546	else
				1547	SwitchCases.push_back(CB);
				1548
				1549	CurBlock = FallThrough;
				1550	}
				1551
				1552	return true;
				1553	}
				1554
				1555	static inline bool areJTsAllowed(const TargetLowering &TLI) {
				1556	return !DisableJumpTables &&
				1557	(TLI.isOperationLegal(ISD::BR_JT, MVT::Other) \|\|
				1558	TLI.isOperationLegal(ISD::BRIND, MVT::Other));
				1559	}
				1560
				1561	/// handleJTSwitchCase - Emit jumptable for current switch case range
				1562	bool SelectionDAGLowering::handleJTSwitchCase(CaseRec& CR,
				1563	CaseRecVector& WorkList,
				1564	Value* SV,
				1565	MachineBasicBlock* Default) {
				1566	Case& FrontCase = *CR.Range.first;
				1567	Case& BackCase = *(CR.Range.second-1);
				1568
				1569	int64_t First = cast<ConstantInt>(FrontCase.Low)->getSExtValue();
				1570	int64_t Last = cast<ConstantInt>(BackCase.High)->getSExtValue();
				1571
				1572	uint64_t TSize = 0;
				1573	for (CaseItr I = CR.Range.first, E = CR.Range.second;
				1574	I!=E; ++I)
				1575	TSize += I->size();
				1576
				1577	if (!areJTsAllowed(TLI) \|\| TSize <= 3)
				1578	return false;
				1579
				1580	double Density = (double)TSize / (double)((Last - First) + 1ULL);
				1581	if (Density < 0.4)
				1582	return false;
				1583
				1584	DOUT << "Lowering jump table\n"
				1585	<< "First entry: " << First << ". Last entry: " << Last << "\n"
				1586	<< "Size: " << TSize << ". Density: " << Density << "\n\n";
				1587
				1588	// Get the MachineFunction which holds the current MBB. This is used when
				1589	// inserting any additional MBBs necessary to represent the switch.
				1590	MachineFunction *CurMF = CurMBB->getParent();
				1591
				1592	// Figure out which block is immediately after the current one.
				1593	MachineBasicBlock *NextBlock = 0;
				1594	MachineFunction::iterator BBI = CR.CaseBB;
				1595
				1596	if (++BBI != CurMBB->getParent()->end())
				1597	NextBlock = BBI;
				1598
				1599	const BasicBlock *LLVMBB = CR.CaseBB->getBasicBlock();
				1600
				1601	// Create a new basic block to hold the code for loading the address
				1602	// of the jump table, and jumping to it. Update successor information;
				1603	// we will either branch to the default case for the switch, or the jump
				1604	// table.
				1605	MachineBasicBlock *JumpTableBB = CurMF->CreateMachineBasicBlock(LLVMBB);
				1606	CurMF->insert(BBI, JumpTableBB);
				1607	CR.CaseBB->addSuccessor(Default);
				1608	CR.CaseBB->addSuccessor(JumpTableBB);
				1609
				1610	// Build a vector of destination BBs, corresponding to each target
				1611	// of the jump table. If the value of the jump table slot corresponds to
				1612	// a case statement, push the case's BB onto the vector, otherwise, push
				1613	// the default BB.
				1614	std::vector<MachineBasicBlock*> DestBBs;
				1615	int64_t TEI = First;
				1616	for (CaseItr I = CR.Range.first, E = CR.Range.second; I != E; ++TEI) {
				1617	int64_t Low = cast<ConstantInt>(I->Low)->getSExtValue();
				1618	int64_t High = cast<ConstantInt>(I->High)->getSExtValue();
				1619
				1620	if ((Low <= TEI) && (TEI <= High)) {
				1621	DestBBs.push_back(I->BB);
				1622	if (TEI==High)
				1623	++I;
				1624	} else {
				1625	DestBBs.push_back(Default);
				1626	}
				1627	}
				1628
				1629	// Update successor info. Add one edge to each unique successor.
				1630	BitVector SuccsHandled(CR.CaseBB->getParent()->getNumBlockIDs());
				1631	for (std::vector<MachineBasicBlock*>::iterator I = DestBBs.begin(),
				1632	E = DestBBs.end(); I != E; ++I) {
				1633	if (!SuccsHandled[(*I)->getNumber()]) {
				1634	SuccsHandled[(*I)->getNumber()] = true;
				1635	JumpTableBB->addSuccessor(*I);
				1636	}
				1637	}
				1638
				1639	// Create a jump table index for this jump table, or return an existing
				1640	// one.
				1641	unsigned JTI = CurMF->getJumpTableInfo()->getJumpTableIndex(DestBBs);
				1642
				1643	// Set the jump table information so that we can codegen it as a second
				1644	// MachineBasicBlock
				1645	JumpTable JT(-1U, JTI, JumpTableBB, Default);
				1646	JumpTableHeader JTH(First, Last, SV, CR.CaseBB, (CR.CaseBB == CurMBB));
				1647	if (CR.CaseBB == CurMBB)
				1648	visitJumpTableHeader(JT, JTH);
				1649
				1650	JTCases.push_back(JumpTableBlock(JTH, JT));
				1651
				1652	return true;
				1653	}
				1654
				1655	/// handleBTSplitSwitchCase - emit comparison and split binary search tree into
				1656	/// 2 subtrees.
				1657	bool SelectionDAGLowering::handleBTSplitSwitchCase(CaseRec& CR,
				1658	CaseRecVector& WorkList,
				1659	Value* SV,
				1660	MachineBasicBlock* Default) {
				1661	// Get the MachineFunction which holds the current MBB. This is used when
				1662	// inserting any additional MBBs necessary to represent the switch.
				1663	MachineFunction *CurMF = CurMBB->getParent();
				1664
				1665	// Figure out which block is immediately after the current one.
				1666	MachineBasicBlock *NextBlock = 0;
				1667	MachineFunction::iterator BBI = CR.CaseBB;
				1668
				1669	if (++BBI != CurMBB->getParent()->end())
				1670	NextBlock = BBI;
				1671
				1672	Case& FrontCase = *CR.Range.first;
				1673	Case& BackCase = *(CR.Range.second-1);
				1674	const BasicBlock *LLVMBB = CR.CaseBB->getBasicBlock();
				1675
				1676	// Size is the number of Cases represented by this range.
				1677	unsigned Size = CR.Range.second - CR.Range.first;
				1678
				1679	int64_t First = cast<ConstantInt>(FrontCase.Low)->getSExtValue();
				1680	int64_t Last = cast<ConstantInt>(BackCase.High)->getSExtValue();
				1681	double FMetric = 0;
				1682	CaseItr Pivot = CR.Range.first + Size/2;
				1683
				1684	// Select optimal pivot, maximizing sum density of LHS and RHS. This will
				1685	// (heuristically) allow us to emit JumpTable's later.
				1686	uint64_t TSize = 0;
				1687	for (CaseItr I = CR.Range.first, E = CR.Range.second;
				1688	I!=E; ++I)
				1689	TSize += I->size();
				1690
				1691	uint64_t LSize = FrontCase.size();
				1692	uint64_t RSize = TSize-LSize;
				1693	DOUT << "Selecting best pivot: \n"
				1694	<< "First: " << First << ", Last: " << Last <<"\n"
				1695	<< "LSize: " << LSize << ", RSize: " << RSize << "\n";
				1696	for (CaseItr I = CR.Range.first, J=I+1, E = CR.Range.second;
				1697	J!=E; ++I, ++J) {
				1698	int64_t LEnd = cast<ConstantInt>(I->High)->getSExtValue();
				1699	int64_t RBegin = cast<ConstantInt>(J->Low)->getSExtValue();
				1700	assert((RBegin-LEnd>=1) && "Invalid case distance");
				1701	double LDensity = (double)LSize / (double)((LEnd - First) + 1ULL);
				1702	double RDensity = (double)RSize / (double)((Last - RBegin) + 1ULL);
				1703	double Metric = Log2_64(RBegin-LEnd)*(LDensity+RDensity);
				1704	// Should always split in some non-trivial place
				1705	DOUT <<"=>Step\n"
				1706	<< "LEnd: " << LEnd << ", RBegin: " << RBegin << "\n"
				1707	<< "LDensity: " << LDensity << ", RDensity: " << RDensity << "\n"
				1708	<< "Metric: " << Metric << "\n";
				1709	if (FMetric < Metric) {
				1710	Pivot = J;
				1711	FMetric = Metric;
				1712	DOUT << "Current metric set to: " << FMetric << "\n";
				1713	}
				1714
				1715	LSize += J->size();
				1716	RSize -= J->size();
				1717	}
				1718	if (areJTsAllowed(TLI)) {
				1719	// If our case is dense we really should handle it earlier!
				1720	assert((FMetric > 0) && "Should handle dense range earlier!");
				1721	} else {
				1722	Pivot = CR.Range.first + Size/2;
				1723	}
				1724
				1725	CaseRange LHSR(CR.Range.first, Pivot);
				1726	CaseRange RHSR(Pivot, CR.Range.second);
				1727	Constant *C = Pivot->Low;
				1728	MachineBasicBlock FalseBB = 0, TrueBB = 0;
				1729
				1730	// We know that we branch to the LHS if the Value being switched on is
				1731	// less than the Pivot value, C. We use this to optimize our binary
				1732	// tree a bit, by recognizing that if SV is greater than or equal to the
				1733	// LHS's Case Value, and that Case Value is exactly one less than the
				1734	// Pivot's Value, then we can branch directly to the LHS's Target,
				1735	// rather than creating a leaf node for it.
				1736	if ((LHSR.second - LHSR.first) == 1 &&
				1737	LHSR.first->High == CR.GE &&
				1738	cast<ConstantInt>(C)->getSExtValue() ==
				1739	(cast<ConstantInt>(CR.GE)->getSExtValue() + 1LL)) {
				1740	TrueBB = LHSR.first->BB;
				1741	} else {
				1742	TrueBB = CurMF->CreateMachineBasicBlock(LLVMBB);
				1743	CurMF->insert(BBI, TrueBB);
				1744	WorkList.push_back(CaseRec(TrueBB, C, CR.GE, LHSR));
				1745	}
				1746
				1747	// Similar to the optimization above, if the Value being switched on is
				1748	// known to be less than the Constant CR.LT, and the current Case Value
				1749	// is CR.LT - 1, then we can branch directly to the target block for
				1750	// the current Case Value, rather than emitting a RHS leaf node for it.
				1751	if ((RHSR.second - RHSR.first) == 1 && CR.LT &&
				1752	cast<ConstantInt>(RHSR.first->Low)->getSExtValue() ==
				1753	(cast<ConstantInt>(CR.LT)->getSExtValue() - 1LL)) {
				1754	FalseBB = RHSR.first->BB;
				1755	} else {
				1756	FalseBB = CurMF->CreateMachineBasicBlock(LLVMBB);
				1757	CurMF->insert(BBI, FalseBB);
				1758	WorkList.push_back(CaseRec(FalseBB,CR.LT,C,RHSR));
				1759	}
				1760
				1761	// Create a CaseBlock record representing a conditional branch to
				1762	// the LHS node if the value being switched on SV is less than C.
				1763	// Otherwise, branch to LHS.
				1764	CaseBlock CB(ISD::SETLT, SV, C, NULL, TrueBB, FalseBB, CR.CaseBB);
				1765
				1766	if (CR.CaseBB == CurMBB)
				1767	visitSwitchCase(CB);
				1768	else
				1769	SwitchCases.push_back(CB);
				1770
				1771	return true;
				1772	}
				1773
				1774	/// handleBitTestsSwitchCase - if current case range has few destination and
				1775	/// range span less, than machine word bitwidth, encode case range into series
				1776	/// of masks and emit bit tests with these masks.
				1777	bool SelectionDAGLowering::handleBitTestsSwitchCase(CaseRec& CR,
				1778	CaseRecVector& WorkList,
				1779	Value* SV,
				1780	MachineBasicBlock* Default){
				1781	unsigned IntPtrBits = TLI.getPointerTy().getSizeInBits();
				1782
				1783	Case& FrontCase = *CR.Range.first;
				1784	Case& BackCase = *(CR.Range.second-1);
				1785
				1786	// Get the MachineFunction which holds the current MBB. This is used when
				1787	// inserting any additional MBBs necessary to represent the switch.
				1788	MachineFunction *CurMF = CurMBB->getParent();
				1789
				1790	unsigned numCmps = 0;
				1791	for (CaseItr I = CR.Range.first, E = CR.Range.second;
				1792	I!=E; ++I) {
				1793	// Single case counts one, case range - two.
				1794	if (I->Low == I->High)
				1795	numCmps +=1;
				1796	else
				1797	numCmps +=2;
				1798	}
				1799
				1800	// Count unique destinations
				1801	SmallSet<MachineBasicBlock*, 4> Dests;
				1802	for (CaseItr I = CR.Range.first, E = CR.Range.second; I!=E; ++I) {
				1803	Dests.insert(I->BB);
				1804	if (Dests.size() > 3)
				1805	// Don't bother the code below, if there are too much unique destinations
				1806	return false;
				1807	}
				1808	DOUT << "Total number of unique destinations: " << Dests.size() << "\n"
				1809	<< "Total number of comparisons: " << numCmps << "\n";
				1810
				1811	// Compute span of values.
				1812	Constant* minValue = FrontCase.Low;
				1813	Constant* maxValue = BackCase.High;
				1814	uint64_t range = cast<ConstantInt>(maxValue)->getSExtValue() -
				1815	cast<ConstantInt>(minValue)->getSExtValue();
				1816	DOUT << "Compare range: " << range << "\n"
				1817	<< "Low bound: " << cast<ConstantInt>(minValue)->getSExtValue() << "\n"
				1818	<< "High bound: " << cast<ConstantInt>(maxValue)->getSExtValue() << "\n";
				1819
				1820	if (range>=IntPtrBits \|\|
				1821	(!(Dests.size() == 1 && numCmps >= 3) &&
				1822	!(Dests.size() == 2 && numCmps >= 5) &&
				1823	!(Dests.size() >= 3 && numCmps >= 6)))
				1824	return false;
				1825
				1826	DOUT << "Emitting bit tests\n";
				1827	int64_t lowBound = 0;
				1828
				1829	// Optimize the case where all the case values fit in a
				1830	// word without having to subtract minValue. In this case,
				1831	// we can optimize away the subtraction.
				1832	if (cast<ConstantInt>(minValue)->getSExtValue() >= 0 &&
				1833	cast<ConstantInt>(maxValue)->getSExtValue() < IntPtrBits) {
				1834	range = cast<ConstantInt>(maxValue)->getSExtValue();
				1835	} else {
				1836	lowBound = cast<ConstantInt>(minValue)->getSExtValue();
				1837	}
				1838
				1839	CaseBitsVector CasesBits;
				1840	unsigned i, count = 0;
				1841
				1842	for (CaseItr I = CR.Range.first, E = CR.Range.second; I!=E; ++I) {
				1843	MachineBasicBlock* Dest = I->BB;
				1844	for (i = 0; i < count; ++i)
				1845	if (Dest == CasesBits[i].BB)
				1846	break;
				1847
				1848	if (i == count) {
				1849	assert((count < 3) && "Too much destinations to test!");
				1850	CasesBits.push_back(CaseBits(0, Dest, 0));
				1851	count++;
				1852	}
				1853
				1854	uint64_t lo = cast<ConstantInt>(I->Low)->getSExtValue() - lowBound;
				1855	uint64_t hi = cast<ConstantInt>(I->High)->getSExtValue() - lowBound;
				1856
				1857	for (uint64_t j = lo; j <= hi; j++) {
				1858	CasesBits[i].Mask \|= 1ULL << j;
				1859	CasesBits[i].Bits++;
				1860	}
				1861
				1862	}
				1863	std::sort(CasesBits.begin(), CasesBits.end(), CaseBitsCmp());
				1864
				1865	BitTestInfo BTC;
				1866
				1867	// Figure out which block is immediately after the current one.
				1868	MachineFunction::iterator BBI = CR.CaseBB;
				1869	++BBI;
				1870
				1871	const BasicBlock *LLVMBB = CR.CaseBB->getBasicBlock();
				1872
				1873	DOUT << "Cases:\n";
				1874	for (unsigned i = 0, e = CasesBits.size(); i!=e; ++i) {
				1875	DOUT << "Mask: " << CasesBits[i].Mask << ", Bits: " << CasesBits[i].Bits
				1876	<< ", BB: " << CasesBits[i].BB << "\n";
				1877
				1878	MachineBasicBlock *CaseBB = CurMF->CreateMachineBasicBlock(LLVMBB);
				1879	CurMF->insert(BBI, CaseBB);
				1880	BTC.push_back(BitTestCase(CasesBits[i].Mask,
				1881	CaseBB,
				1882	CasesBits[i].BB));
				1883	}
				1884
				1885	BitTestBlock BTB(lowBound, range, SV,
				1886	-1U, (CR.CaseBB == CurMBB),
				1887	CR.CaseBB, Default, BTC);
				1888
				1889	if (CR.CaseBB == CurMBB)
				1890	visitBitTestHeader(BTB);
				1891
				1892	BitTestCases.push_back(BTB);
				1893
				1894	return true;
				1895	}
				1896
				1897
				1898	/// Clusterify - Transform simple list of Cases into list of CaseRange's
				1899	unsigned SelectionDAGLowering::Clusterify(CaseVector& Cases,
				1900	const SwitchInst& SI) {
				1901	unsigned numCmps = 0;
				1902
				1903	// Start with "simple" cases
				1904	for (unsigned i = 1; i < SI.getNumSuccessors(); ++i) {
				1905	MachineBasicBlock *SMBB = FuncInfo.MBBMap[SI.getSuccessor(i)];
				1906	Cases.push_back(Case(SI.getSuccessorValue(i),
				1907	SI.getSuccessorValue(i),
				1908	SMBB));
				1909	}
				1910	std::sort(Cases.begin(), Cases.end(), CaseCmp());
				1911
				1912	// Merge case into clusters
				1913	if (Cases.size()>=2)
				1914	// Must recompute end() each iteration because it may be
				1915	// invalidated by erase if we hold on to it
				1916	for (CaseItr I=Cases.begin(), J=++(Cases.begin()); J!=Cases.end(); ) {
				1917	int64_t nextValue = cast<ConstantInt>(J->Low)->getSExtValue();
				1918	int64_t currentValue = cast<ConstantInt>(I->High)->getSExtValue();
				1919	MachineBasicBlock* nextBB = J->BB;
				1920	MachineBasicBlock* currentBB = I->BB;
				1921
				1922	// If the two neighboring cases go to the same destination, merge them
				1923	// into a single case.
				1924	if ((nextValue-currentValue==1) && (currentBB == nextBB)) {
				1925	I->High = J->High;
				1926	J = Cases.erase(J);
				1927	} else {
				1928	I = J++;
				1929	}
				1930	}
				1931
				1932	for (CaseItr I=Cases.begin(), E=Cases.end(); I!=E; ++I, ++numCmps) {
				1933	if (I->Low != I->High)
				1934	// A range counts double, since it requires two compares.
				1935	++numCmps;
				1936	}
				1937
				1938	return numCmps;
				1939	}
				1940
				1941	void SelectionDAGLowering::visitSwitch(SwitchInst &SI) {
				1942	// Figure out which block is immediately after the current one.
				1943	MachineBasicBlock *NextBlock = 0;
				1944	MachineFunction::iterator BBI = CurMBB;
				1945
				1946	MachineBasicBlock *Default = FuncInfo.MBBMap[SI.getDefaultDest()];
				1947
				1948	// If there is only the default destination, branch to it if it is not the
				1949	// next basic block. Otherwise, just fall through.
				1950	if (SI.getNumOperands() == 2) {
				1951	// Update machine-CFG edges.
				1952
				1953	// If this is not a fall-through branch, emit the branch.
				1954	CurMBB->addSuccessor(Default);
				1955	if (Default != NextBlock)
				1956	DAG.setRoot(DAG.getNode(ISD::BR, MVT::Other, getControlRoot(),
				1957	DAG.getBasicBlock(Default)));
				1958
				1959	return;
				1960	}
				1961
				1962	// If there are any non-default case statements, create a vector of Cases
				1963	// representing each one, and sort the vector so that we can efficiently
				1964	// create a binary search tree from them.
				1965	CaseVector Cases;
				1966	unsigned numCmps = Clusterify(Cases, SI);
				1967	DOUT << "Clusterify finished. Total clusters: " << Cases.size()
				1968	<< ". Total compares: " << numCmps << "\n";
				1969
				1970	// Get the Value to be switched on and default basic blocks, which will be
				1971	// inserted into CaseBlock records, representing basic blocks in the binary
				1972	// search tree.
				1973	Value *SV = SI.getOperand(0);
				1974
				1975	// Push the initial CaseRec onto the worklist
				1976	CaseRecVector WorkList;
				1977	WorkList.push_back(CaseRec(CurMBB,0,0,CaseRange(Cases.begin(),Cases.end())));
				1978
				1979	while (!WorkList.empty()) {
				1980	// Grab a record representing a case range to process off the worklist
				1981	CaseRec CR = WorkList.back();
				1982	WorkList.pop_back();
				1983
				1984	if (handleBitTestsSwitchCase(CR, WorkList, SV, Default))
				1985	continue;
				1986
				1987	// If the range has few cases (two or less) emit a series of specific
				1988	// tests.
				1989	if (handleSmallSwitchRange(CR, WorkList, SV, Default))
				1990	continue;
				1991
				1992	// If the switch has more than 5 blocks, and at least 40% dense, and the
				1993	// target supports indirect branches, then emit a jump table rather than
				1994	// lowering the switch to a binary tree of conditional branches.
				1995	if (handleJTSwitchCase(CR, WorkList, SV, Default))
				1996	continue;
				1997
				1998	// Emit binary tree. We need to pick a pivot, and push left and right ranges
				1999	// onto the worklist. Leafs are handled via handleSmallSwitchRange() call.
				2000	handleBTSplitSwitchCase(CR, WorkList, SV, Default);
				2001	}
				2002	}
				2003
				2004
				2005	void SelectionDAGLowering::visitSub(User &I) {
				2006	// -0.0 - X --> fneg
				2007	const Type *Ty = I.getType();
				2008	if (isa<VectorType>(Ty)) {
				2009	if (ConstantVector *CV = dyn_cast<ConstantVector>(I.getOperand(0))) {
				2010	const VectorType *DestTy = cast<VectorType>(I.getType());
				2011	const Type *ElTy = DestTy->getElementType();
				2012	if (ElTy->isFloatingPoint()) {
				2013	unsigned VL = DestTy->getNumElements();
				2014	std::vector<Constant*> NZ(VL, ConstantFP::getNegativeZero(ElTy));
				2015	Constant *CNZ = ConstantVector::get(&NZ[0], NZ.size());
				2016	if (CV == CNZ) {
				2017	SDValue Op2 = getValue(I.getOperand(1));
				2018	setValue(&I, DAG.getNode(ISD::FNEG, Op2.getValueType(), Op2));
				2019	return;
				2020	}
				2021	}
				2022	}
				2023	}
				2024	if (Ty->isFloatingPoint()) {
				2025	if (ConstantFP *CFP = dyn_cast<ConstantFP>(I.getOperand(0)))
				2026	if (CFP->isExactlyValue(ConstantFP::getNegativeZero(Ty)->getValueAPF())) {
				2027	SDValue Op2 = getValue(I.getOperand(1));
				2028	setValue(&I, DAG.getNode(ISD::FNEG, Op2.getValueType(), Op2));
				2029	return;
				2030	}
				2031	}
				2032
				2033	visitBinary(I, Ty->isFPOrFPVector() ? ISD::FSUB : ISD::SUB);
				2034	}
				2035
				2036	void SelectionDAGLowering::visitBinary(User &I, unsigned OpCode) {
				2037	SDValue Op1 = getValue(I.getOperand(0));
				2038	SDValue Op2 = getValue(I.getOperand(1));
				2039
				2040	setValue(&I, DAG.getNode(OpCode, Op1.getValueType(), Op1, Op2));
				2041	}
				2042
				2043	void SelectionDAGLowering::visitShift(User &I, unsigned Opcode) {
				2044	SDValue Op1 = getValue(I.getOperand(0));
				2045	SDValue Op2 = getValue(I.getOperand(1));
				2046	if (!isa<VectorType>(I.getType())) {
				2047	if (TLI.getShiftAmountTy().bitsLT(Op2.getValueType()))
				2048	Op2 = DAG.getNode(ISD::TRUNCATE, TLI.getShiftAmountTy(), Op2);
				2049	else if (TLI.getShiftAmountTy().bitsGT(Op2.getValueType()))
				2050	Op2 = DAG.getNode(ISD::ANY_EXTEND, TLI.getShiftAmountTy(), Op2);
				2051	}
				2052
				2053	setValue(&I, DAG.getNode(Opcode, Op1.getValueType(), Op1, Op2));
				2054	}
				2055
				2056	void SelectionDAGLowering::visitICmp(User &I) {
				2057	ICmpInst::Predicate predicate = ICmpInst::BAD_ICMP_PREDICATE;
				2058	if (ICmpInst *IC = dyn_cast<ICmpInst>(&I))
				2059	predicate = IC->getPredicate();
				2060	else if (ConstantExpr *IC = dyn_cast<ConstantExpr>(&I))
				2061	predicate = ICmpInst::Predicate(IC->getPredicate());
				2062	SDValue Op1 = getValue(I.getOperand(0));
				2063	SDValue Op2 = getValue(I.getOperand(1));
				2064	ISD::CondCode Opcode;
				2065	switch (predicate) {
				2066	case ICmpInst::ICMP_EQ : Opcode = ISD::SETEQ; break;
				2067	case ICmpInst::ICMP_NE : Opcode = ISD::SETNE; break;
				2068	case ICmpInst::ICMP_UGT : Opcode = ISD::SETUGT; break;
				2069	case ICmpInst::ICMP_UGE : Opcode = ISD::SETUGE; break;
				2070	case ICmpInst::ICMP_ULT : Opcode = ISD::SETULT; break;
				2071	case ICmpInst::ICMP_ULE : Opcode = ISD::SETULE; break;
				2072	case ICmpInst::ICMP_SGT : Opcode = ISD::SETGT; break;
				2073	case ICmpInst::ICMP_SGE : Opcode = ISD::SETGE; break;
				2074	case ICmpInst::ICMP_SLT : Opcode = ISD::SETLT; break;
				2075	case ICmpInst::ICMP_SLE : Opcode = ISD::SETLE; break;
				2076	default:
				2077	assert(!"Invalid ICmp predicate value");
				2078	Opcode = ISD::SETEQ;
				2079	break;
				2080	}
				2081	setValue(&I, DAG.getSetCC(MVT::i1, Op1, Op2, Opcode));
				2082	}
				2083
				2084	void SelectionDAGLowering::visitFCmp(User &I) {
				2085	FCmpInst::Predicate predicate = FCmpInst::BAD_FCMP_PREDICATE;
				2086	if (FCmpInst *FC = dyn_cast<FCmpInst>(&I))
				2087	predicate = FC->getPredicate();
				2088	else if (ConstantExpr *FC = dyn_cast<ConstantExpr>(&I))
				2089	predicate = FCmpInst::Predicate(FC->getPredicate());
				2090	SDValue Op1 = getValue(I.getOperand(0));
				2091	SDValue Op2 = getValue(I.getOperand(1));
				2092	ISD::CondCode Condition, FOC, FPC;
				2093	switch (predicate) {
				2094	case FCmpInst::FCMP_FALSE: FOC = FPC = ISD::SETFALSE; break;
				2095	case FCmpInst::FCMP_OEQ: FOC = ISD::SETEQ; FPC = ISD::SETOEQ; break;
				2096	case FCmpInst::FCMP_OGT: FOC = ISD::SETGT; FPC = ISD::SETOGT; break;
				2097	case FCmpInst::FCMP_OGE: FOC = ISD::SETGE; FPC = ISD::SETOGE; break;
				2098	case FCmpInst::FCMP_OLT: FOC = ISD::SETLT; FPC = ISD::SETOLT; break;
				2099	case FCmpInst::FCMP_OLE: FOC = ISD::SETLE; FPC = ISD::SETOLE; break;
				2100	case FCmpInst::FCMP_ONE: FOC = ISD::SETNE; FPC = ISD::SETONE; break;
				2101	case FCmpInst::FCMP_ORD: FOC = FPC = ISD::SETO; break;
				2102	case FCmpInst::FCMP_UNO: FOC = FPC = ISD::SETUO; break;
				2103	case FCmpInst::FCMP_UEQ: FOC = ISD::SETEQ; FPC = ISD::SETUEQ; break;
				2104	case FCmpInst::FCMP_UGT: FOC = ISD::SETGT; FPC = ISD::SETUGT; break;
				2105	case FCmpInst::FCMP_UGE: FOC = ISD::SETGE; FPC = ISD::SETUGE; break;
				2106	case FCmpInst::FCMP_ULT: FOC = ISD::SETLT; FPC = ISD::SETULT; break;
				2107	case FCmpInst::FCMP_ULE: FOC = ISD::SETLE; FPC = ISD::SETULE; break;
				2108	case FCmpInst::FCMP_UNE: FOC = ISD::SETNE; FPC = ISD::SETUNE; break;
				2109	case FCmpInst::FCMP_TRUE: FOC = FPC = ISD::SETTRUE; break;
				2110	default:
				2111	assert(!"Invalid FCmp predicate value");
				2112	FOC = FPC = ISD::SETFALSE;
				2113	break;
				2114	}
				2115	if (FiniteOnlyFPMath())
				2116	Condition = FOC;
				2117	else
				2118	Condition = FPC;
				2119	setValue(&I, DAG.getSetCC(MVT::i1, Op1, Op2, Condition));
				2120	}
				2121
				2122	void SelectionDAGLowering::visitVICmp(User &I) {
				2123	ICmpInst::Predicate predicate = ICmpInst::BAD_ICMP_PREDICATE;
				2124	if (VICmpInst *IC = dyn_cast<VICmpInst>(&I))
				2125	predicate = IC->getPredicate();
				2126	else if (ConstantExpr *IC = dyn_cast<ConstantExpr>(&I))
				2127	predicate = ICmpInst::Predicate(IC->getPredicate());
				2128	SDValue Op1 = getValue(I.getOperand(0));
				2129	SDValue Op2 = getValue(I.getOperand(1));
				2130	ISD::CondCode Opcode;
				2131	switch (predicate) {
				2132	case ICmpInst::ICMP_EQ : Opcode = ISD::SETEQ; break;
				2133	case ICmpInst::ICMP_NE : Opcode = ISD::SETNE; break;
				2134	case ICmpInst::ICMP_UGT : Opcode = ISD::SETUGT; break;
				2135	case ICmpInst::ICMP_UGE : Opcode = ISD::SETUGE; break;
				2136	case ICmpInst::ICMP_ULT : Opcode = ISD::SETULT; break;
				2137	case ICmpInst::ICMP_ULE : Opcode = ISD::SETULE; break;
				2138	case ICmpInst::ICMP_SGT : Opcode = ISD::SETGT; break;
				2139	case ICmpInst::ICMP_SGE : Opcode = ISD::SETGE; break;
				2140	case ICmpInst::ICMP_SLT : Opcode = ISD::SETLT; break;
				2141	case ICmpInst::ICMP_SLE : Opcode = ISD::SETLE; break;
				2142	default:
				2143	assert(!"Invalid ICmp predicate value");
				2144	Opcode = ISD::SETEQ;
				2145	break;
				2146	}
				2147	setValue(&I, DAG.getVSetCC(Op1.getValueType(), Op1, Op2, Opcode));
				2148	}
				2149
				2150	void SelectionDAGLowering::visitVFCmp(User &I) {
				2151	FCmpInst::Predicate predicate = FCmpInst::BAD_FCMP_PREDICATE;
				2152	if (VFCmpInst *FC = dyn_cast<VFCmpInst>(&I))
				2153	predicate = FC->getPredicate();
				2154	else if (ConstantExpr *FC = dyn_cast<ConstantExpr>(&I))
				2155	predicate = FCmpInst::Predicate(FC->getPredicate());
				2156	SDValue Op1 = getValue(I.getOperand(0));
				2157	SDValue Op2 = getValue(I.getOperand(1));
				2158	ISD::CondCode Condition, FOC, FPC;
				2159	switch (predicate) {
				2160	case FCmpInst::FCMP_FALSE: FOC = FPC = ISD::SETFALSE; break;
				2161	case FCmpInst::FCMP_OEQ: FOC = ISD::SETEQ; FPC = ISD::SETOEQ; break;
				2162	case FCmpInst::FCMP_OGT: FOC = ISD::SETGT; FPC = ISD::SETOGT; break;
				2163	case FCmpInst::FCMP_OGE: FOC = ISD::SETGE; FPC = ISD::SETOGE; break;
				2164	case FCmpInst::FCMP_OLT: FOC = ISD::SETLT; FPC = ISD::SETOLT; break;
				2165	case FCmpInst::FCMP_OLE: FOC = ISD::SETLE; FPC = ISD::SETOLE; break;
				2166	case FCmpInst::FCMP_ONE: FOC = ISD::SETNE; FPC = ISD::SETONE; break;
				2167	case FCmpInst::FCMP_ORD: FOC = FPC = ISD::SETO; break;
				2168	case FCmpInst::FCMP_UNO: FOC = FPC = ISD::SETUO; break;
				2169	case FCmpInst::FCMP_UEQ: FOC = ISD::SETEQ; FPC = ISD::SETUEQ; break;
				2170	case FCmpInst::FCMP_UGT: FOC = ISD::SETGT; FPC = ISD::SETUGT; break;
				2171	case FCmpInst::FCMP_UGE: FOC = ISD::SETGE; FPC = ISD::SETUGE; break;
				2172	case FCmpInst::FCMP_ULT: FOC = ISD::SETLT; FPC = ISD::SETULT; break;
				2173	case FCmpInst::FCMP_ULE: FOC = ISD::SETLE; FPC = ISD::SETULE; break;
				2174	case FCmpInst::FCMP_UNE: FOC = ISD::SETNE; FPC = ISD::SETUNE; break;
				2175	case FCmpInst::FCMP_TRUE: FOC = FPC = ISD::SETTRUE; break;
				2176	default:
				2177	assert(!"Invalid VFCmp predicate value");
				2178	FOC = FPC = ISD::SETFALSE;
				2179	break;
				2180	}
				2181	if (FiniteOnlyFPMath())
				2182	Condition = FOC;
				2183	else
				2184	Condition = FPC;
				2185
				2186	MVT DestVT = TLI.getValueType(I.getType());
				2187
				2188	setValue(&I, DAG.getVSetCC(DestVT, Op1, Op2, Condition));
				2189	}
				2190
				2191	void SelectionDAGLowering::visitSelect(User &I) {
				2192	SDValue Cond = getValue(I.getOperand(0));
				2193	SDValue TrueVal = getValue(I.getOperand(1));
				2194	SDValue FalseVal = getValue(I.getOperand(2));
				2195	setValue(&I, DAG.getNode(ISD::SELECT, TrueVal.getValueType(), Cond,
				2196	TrueVal, FalseVal));
				2197	}
				2198
				2199
				2200	void SelectionDAGLowering::visitTrunc(User &I) {
				2201	// TruncInst cannot be a no-op cast because sizeof(src) > sizeof(dest).
				2202	SDValue N = getValue(I.getOperand(0));
				2203	MVT DestVT = TLI.getValueType(I.getType());
				2204	setValue(&I, DAG.getNode(ISD::TRUNCATE, DestVT, N));
				2205	}
				2206
				2207	void SelectionDAGLowering::visitZExt(User &I) {
				2208	// ZExt cannot be a no-op cast because sizeof(src) < sizeof(dest).
				2209	// ZExt also can't be a cast to bool for same reason. So, nothing much to do
				2210	SDValue N = getValue(I.getOperand(0));
				2211	MVT DestVT = TLI.getValueType(I.getType());
				2212	setValue(&I, DAG.getNode(ISD::ZERO_EXTEND, DestVT, N));
				2213	}
				2214
				2215	void SelectionDAGLowering::visitSExt(User &I) {
				2216	// SExt cannot be a no-op cast because sizeof(src) < sizeof(dest).
				2217	// SExt also can't be a cast to bool for same reason. So, nothing much to do
				2218	SDValue N = getValue(I.getOperand(0));
				2219	MVT DestVT = TLI.getValueType(I.getType());
				2220	setValue(&I, DAG.getNode(ISD::SIGN_EXTEND, DestVT, N));
				2221	}
				2222
				2223	void SelectionDAGLowering::visitFPTrunc(User &I) {
				2224	// FPTrunc is never a no-op cast, no need to check
				2225	SDValue N = getValue(I.getOperand(0));
				2226	MVT DestVT = TLI.getValueType(I.getType());
				2227	setValue(&I, DAG.getNode(ISD::FP_ROUND, DestVT, N, DAG.getIntPtrConstant(0)));
				2228	}
				2229
				2230	void SelectionDAGLowering::visitFPExt(User &I){
				2231	// FPTrunc is never a no-op cast, no need to check
				2232	SDValue N = getValue(I.getOperand(0));
				2233	MVT DestVT = TLI.getValueType(I.getType());
				2234	setValue(&I, DAG.getNode(ISD::FP_EXTEND, DestVT, N));
				2235	}
				2236
				2237	void SelectionDAGLowering::visitFPToUI(User &I) {
				2238	// FPToUI is never a no-op cast, no need to check
				2239	SDValue N = getValue(I.getOperand(0));
				2240	MVT DestVT = TLI.getValueType(I.getType());
				2241	setValue(&I, DAG.getNode(ISD::FP_TO_UINT, DestVT, N));
				2242	}
				2243
				2244	void SelectionDAGLowering::visitFPToSI(User &I) {
				2245	// FPToSI is never a no-op cast, no need to check
				2246	SDValue N = getValue(I.getOperand(0));
				2247	MVT DestVT = TLI.getValueType(I.getType());
				2248	setValue(&I, DAG.getNode(ISD::FP_TO_SINT, DestVT, N));
				2249	}
				2250
				2251	void SelectionDAGLowering::visitUIToFP(User &I) {
				2252	// UIToFP is never a no-op cast, no need to check
				2253	SDValue N = getValue(I.getOperand(0));
				2254	MVT DestVT = TLI.getValueType(I.getType());
				2255	setValue(&I, DAG.getNode(ISD::UINT_TO_FP, DestVT, N));
				2256	}
				2257
				2258	void SelectionDAGLowering::visitSIToFP(User &I){
				2259	// UIToFP is never a no-op cast, no need to check
				2260	SDValue N = getValue(I.getOperand(0));
				2261	MVT DestVT = TLI.getValueType(I.getType());
				2262	setValue(&I, DAG.getNode(ISD::SINT_TO_FP, DestVT, N));
				2263	}
				2264
				2265	void SelectionDAGLowering::visitPtrToInt(User &I) {
				2266	// What to do depends on the size of the integer and the size of the pointer.
				2267	// We can either truncate, zero extend, or no-op, accordingly.
				2268	SDValue N = getValue(I.getOperand(0));
				2269	MVT SrcVT = N.getValueType();
				2270	MVT DestVT = TLI.getValueType(I.getType());
				2271	SDValue Result;
				2272	if (DestVT.bitsLT(SrcVT))
				2273	Result = DAG.getNode(ISD::TRUNCATE, DestVT, N);
				2274	else
				2275	// Note: ZERO_EXTEND can handle cases where the sizes are equal too
				2276	Result = DAG.getNode(ISD::ZERO_EXTEND, DestVT, N);
				2277	setValue(&I, Result);
				2278	}
				2279
				2280	void SelectionDAGLowering::visitIntToPtr(User &I) {
				2281	// What to do depends on the size of the integer and the size of the pointer.
				2282	// We can either truncate, zero extend, or no-op, accordingly.
				2283	SDValue N = getValue(I.getOperand(0));
				2284	MVT SrcVT = N.getValueType();
				2285	MVT DestVT = TLI.getValueType(I.getType());
				2286	if (DestVT.bitsLT(SrcVT))
				2287	setValue(&I, DAG.getNode(ISD::TRUNCATE, DestVT, N));
				2288	else
				2289	// Note: ZERO_EXTEND can handle cases where the sizes are equal too
				2290	setValue(&I, DAG.getNode(ISD::ZERO_EXTEND, DestVT, N));
				2291	}
				2292
				2293	void SelectionDAGLowering::visitBitCast(User &I) {
				2294	SDValue N = getValue(I.getOperand(0));
				2295	MVT DestVT = TLI.getValueType(I.getType());
				2296
				2297	// BitCast assures us that source and destination are the same size so this
				2298	// is either a BIT_CONVERT or a no-op.
				2299	if (DestVT != N.getValueType())
				2300	setValue(&I, DAG.getNode(ISD::BIT_CONVERT, DestVT, N)); // convert types
				2301	else
				2302	setValue(&I, N); // noop cast.
				2303	}
				2304
				2305	void SelectionDAGLowering::visitInsertElement(User &I) {
				2306	SDValue InVec = getValue(I.getOperand(0));
				2307	SDValue InVal = getValue(I.getOperand(1));
				2308	SDValue InIdx = DAG.getNode(ISD::ZERO_EXTEND, TLI.getPointerTy(),
				2309	getValue(I.getOperand(2)));
				2310
				2311	setValue(&I, DAG.getNode(ISD::INSERT_VECTOR_ELT,
				2312	TLI.getValueType(I.getType()),
				2313	InVec, InVal, InIdx));
				2314	}
				2315
				2316	void SelectionDAGLowering::visitExtractElement(User &I) {
				2317	SDValue InVec = getValue(I.getOperand(0));
				2318	SDValue InIdx = DAG.getNode(ISD::ZERO_EXTEND, TLI.getPointerTy(),
				2319	getValue(I.getOperand(1)));
				2320	setValue(&I, DAG.getNode(ISD::EXTRACT_VECTOR_ELT,
				2321	TLI.getValueType(I.getType()), InVec, InIdx));
				2322	}
				2323
				2324	void SelectionDAGLowering::visitShuffleVector(User &I) {
				2325	SDValue V1 = getValue(I.getOperand(0));
				2326	SDValue V2 = getValue(I.getOperand(1));
				2327	SDValue Mask = getValue(I.getOperand(2));
				2328
				2329	setValue(&I, DAG.getNode(ISD::VECTOR_SHUFFLE,
				2330	TLI.getValueType(I.getType()),
				2331	V1, V2, Mask));
				2332	}
				2333
				2334	void SelectionDAGLowering::visitInsertValue(InsertValueInst &I) {
				2335	const Value *Op0 = I.getOperand(0);
				2336	const Value *Op1 = I.getOperand(1);
				2337	const Type *AggTy = I.getType();
				2338	const Type *ValTy = Op1->getType();
				2339	bool IntoUndef = isa<UndefValue>(Op0);
				2340	bool FromUndef = isa<UndefValue>(Op1);
				2341
				2342	unsigned LinearIndex = ComputeLinearIndex(TLI, AggTy,
				2343	I.idx_begin(), I.idx_end());
				2344
				2345	SmallVector<MVT, 4> AggValueVTs;
				2346	ComputeValueVTs(TLI, AggTy, AggValueVTs);
				2347	SmallVector<MVT, 4> ValValueVTs;
				2348	ComputeValueVTs(TLI, ValTy, ValValueVTs);
				2349
				2350	unsigned NumAggValues = AggValueVTs.size();
				2351	unsigned NumValValues = ValValueVTs.size();
				2352	SmallVector<SDValue, 4> Values(NumAggValues);
				2353
				2354	SDValue Agg = getValue(Op0);
				2355	SDValue Val = getValue(Op1);
				2356	unsigned i = 0;
				2357	// Copy the beginning value(s) from the original aggregate.
				2358	for (; i != LinearIndex; ++i)
				2359	Values[i] = IntoUndef ? DAG.getNode(ISD::UNDEF, AggValueVTs[i]) :
				2360	SDValue(Agg.getNode(), Agg.getResNo() + i);
				2361	// Copy values from the inserted value(s).
				2362	for (; i != LinearIndex + NumValValues; ++i)
				2363	Values[i] = FromUndef ? DAG.getNode(ISD::UNDEF, AggValueVTs[i]) :
				2364	SDValue(Val.getNode(), Val.getResNo() + i - LinearIndex);
				2365	// Copy remaining value(s) from the original aggregate.
				2366	for (; i != NumAggValues; ++i)
				2367	Values[i] = IntoUndef ? DAG.getNode(ISD::UNDEF, AggValueVTs[i]) :
				2368	SDValue(Agg.getNode(), Agg.getResNo() + i);
				2369
				2370	setValue(&I, DAG.getMergeValues(DAG.getVTList(&AggValueVTs[0], NumAggValues),
				2371	&Values[0], NumAggValues));
				2372	}
				2373
				2374	void SelectionDAGLowering::visitExtractValue(ExtractValueInst &I) {
				2375	const Value *Op0 = I.getOperand(0);
				2376	const Type *AggTy = Op0->getType();
				2377	const Type *ValTy = I.getType();
				2378	bool OutOfUndef = isa<UndefValue>(Op0);
				2379
				2380	unsigned LinearIndex = ComputeLinearIndex(TLI, AggTy,
				2381	I.idx_begin(), I.idx_end());
				2382
				2383	SmallVector<MVT, 4> ValValueVTs;
				2384	ComputeValueVTs(TLI, ValTy, ValValueVTs);
				2385
				2386	unsigned NumValValues = ValValueVTs.size();
				2387	SmallVector<SDValue, 4> Values(NumValValues);
				2388
				2389	SDValue Agg = getValue(Op0);
				2390	// Copy out the selected value(s).
				2391	for (unsigned i = LinearIndex; i != LinearIndex + NumValValues; ++i)
				2392	Values[i - LinearIndex] =
				2393	OutOfUndef ? DAG.getNode(ISD::UNDEF, Agg.getNode()->getValueType(Agg.getResNo() + i)) :
				2394	SDValue(Agg.getNode(), Agg.getResNo() + i);
				2395
				2396	setValue(&I, DAG.getMergeValues(DAG.getVTList(&ValValueVTs[0], NumValValues),
				2397	&Values[0], NumValValues));
				2398	}
				2399
				2400
				2401	void SelectionDAGLowering::visitGetElementPtr(User &I) {
				2402	SDValue N = getValue(I.getOperand(0));
				2403	const Type *Ty = I.getOperand(0)->getType();
				2404
				2405	for (GetElementPtrInst::op_iterator OI = I.op_begin()+1, E = I.op_end();
				2406	OI != E; ++OI) {
				2407	Value Idx = OI;
				2408	if (const StructType *StTy = dyn_cast<StructType>(Ty)) {
				2409	unsigned Field = cast<ConstantInt>(Idx)->getZExtValue();
				2410	if (Field) {
				2411	// N = N + Offset
				2412	uint64_t Offset = TD->getStructLayout(StTy)->getElementOffset(Field);
				2413	N = DAG.getNode(ISD::ADD, N.getValueType(), N,
				2414	DAG.getIntPtrConstant(Offset));
				2415	}
				2416	Ty = StTy->getElementType(Field);
				2417	} else {
				2418	Ty = cast<SequentialType>(Ty)->getElementType();
				2419
				2420	// If this is a constant subscript, handle it quickly.
				2421	if (ConstantInt *CI = dyn_cast<ConstantInt>(Idx)) {
				2422	if (CI->getZExtValue() == 0) continue;
				2423	uint64_t Offs =
				2424	TD->getABITypeSize(Ty)*cast<ConstantInt>(CI)->getSExtValue();
				2425	N = DAG.getNode(ISD::ADD, N.getValueType(), N,
				2426	DAG.getIntPtrConstant(Offs));
				2427	continue;
				2428	}
				2429
				2430	// N = N + Idx * ElementSize;
				2431	uint64_t ElementSize = TD->getABITypeSize(Ty);
				2432	SDValue IdxN = getValue(Idx);
				2433
				2434	// If the index is smaller or larger than intptr_t, truncate or extend
				2435	// it.
				2436	if (IdxN.getValueType().bitsLT(N.getValueType()))
				2437	IdxN = DAG.getNode(ISD::SIGN_EXTEND, N.getValueType(), IdxN);
				2438	else if (IdxN.getValueType().bitsGT(N.getValueType()))
				2439	IdxN = DAG.getNode(ISD::TRUNCATE, N.getValueType(), IdxN);
				2440
				2441	// If this is a multiply by a power of two, turn it into a shl
				2442	// immediately. This is a very common case.
				2443	if (ElementSize != 1) {
				2444	if (isPowerOf2_64(ElementSize)) {
				2445	unsigned Amt = Log2_64(ElementSize);
				2446	IdxN = DAG.getNode(ISD::SHL, N.getValueType(), IdxN,
				2447	DAG.getConstant(Amt, TLI.getShiftAmountTy()));
				2448	} else {
				2449	SDValue Scale = DAG.getIntPtrConstant(ElementSize);
				2450	IdxN = DAG.getNode(ISD::MUL, N.getValueType(), IdxN, Scale);
				2451	}
				2452	}
				2453
				2454	N = DAG.getNode(ISD::ADD, N.getValueType(), N, IdxN);
				2455	}
				2456	}
				2457	setValue(&I, N);
				2458	}
				2459
				2460	void SelectionDAGLowering::visitAlloca(AllocaInst &I) {
				2461	// If this is a fixed sized alloca in the entry block of the function,
				2462	// allocate it statically on the stack.
				2463	if (FuncInfo.StaticAllocaMap.count(&I))
				2464	return; // getValue will auto-populate this.
				2465
				2466	const Type *Ty = I.getAllocatedType();
				2467	uint64_t TySize = TLI.getTargetData()->getABITypeSize(Ty);
				2468	unsigned Align =
				2469	std::max((unsigned)TLI.getTargetData()->getPrefTypeAlignment(Ty),
				2470	I.getAlignment());
				2471
				2472	SDValue AllocSize = getValue(I.getArraySize());
				2473	MVT IntPtr = TLI.getPointerTy();
				2474	if (IntPtr.bitsLT(AllocSize.getValueType()))
				2475	AllocSize = DAG.getNode(ISD::TRUNCATE, IntPtr, AllocSize);
				2476	else if (IntPtr.bitsGT(AllocSize.getValueType()))
				2477	AllocSize = DAG.getNode(ISD::ZERO_EXTEND, IntPtr, AllocSize);
				2478
				2479	AllocSize = DAG.getNode(ISD::MUL, IntPtr, AllocSize,
				2480	DAG.getIntPtrConstant(TySize));
				2481
				2482	// Handle alignment. If the requested alignment is less than or equal to
				2483	// the stack alignment, ignore it. If the size is greater than or equal to
				2484	// the stack alignment, we note this in the DYNAMIC_STACKALLOC node.
				2485	unsigned StackAlign =
				2486	TLI.getTargetMachine().getFrameInfo()->getStackAlignment();
				2487	if (Align <= StackAlign)
				2488	Align = 0;
				2489
				2490	// Round the size of the allocation up to the stack alignment size
				2491	// by add SA-1 to the size.
				2492	AllocSize = DAG.getNode(ISD::ADD, AllocSize.getValueType(), AllocSize,
				2493	DAG.getIntPtrConstant(StackAlign-1));
				2494	// Mask out the low bits for alignment purposes.
				2495	AllocSize = DAG.getNode(ISD::AND, AllocSize.getValueType(), AllocSize,
				2496	DAG.getIntPtrConstant(~(uint64_t)(StackAlign-1)));
				2497
				2498	SDValue Ops[] = { getRoot(), AllocSize, DAG.getIntPtrConstant(Align) };
				2499	const MVT *VTs = DAG.getNodeValueTypes(AllocSize.getValueType(),
				2500	MVT::Other);
				2501	SDValue DSA = DAG.getNode(ISD::DYNAMIC_STACKALLOC, VTs, 2, Ops, 3);
				2502	setValue(&I, DSA);
				2503	DAG.setRoot(DSA.getValue(1));
				2504
				2505	// Inform the Frame Information that we have just allocated a variable-sized
				2506	// object.
				2507	CurMBB->getParent()->getFrameInfo()->CreateVariableSizedObject();
				2508	}
				2509
				2510	void SelectionDAGLowering::visitLoad(LoadInst &I) {
				2511	const Value *SV = I.getOperand(0);
				2512	SDValue Ptr = getValue(SV);
				2513
				2514	const Type *Ty = I.getType();
				2515	bool isVolatile = I.isVolatile();
				2516	unsigned Alignment = I.getAlignment();
				2517
				2518	SmallVector<MVT, 4> ValueVTs;
				2519	SmallVector<uint64_t, 4> Offsets;
				2520	ComputeValueVTs(TLI, Ty, ValueVTs, &Offsets);
				2521	unsigned NumValues = ValueVTs.size();
				2522	if (NumValues == 0)
				2523	return;
				2524
				2525	SDValue Root;
				2526	bool ConstantMemory = false;
				2527	if (I.isVolatile())
				2528	// Serialize volatile loads with other side effects.
				2529	Root = getRoot();
				2530	else if (AA->pointsToConstantMemory(SV)) {
				2531	// Do not serialize (non-volatile) loads of constant memory with anything.
				2532	Root = DAG.getEntryNode();
				2533	ConstantMemory = true;
				2534	} else {
				2535	// Do not serialize non-volatile loads against each other.
				2536	Root = DAG.getRoot();
				2537	}
				2538
				2539	SmallVector<SDValue, 4> Values(NumValues);
				2540	SmallVector<SDValue, 4> Chains(NumValues);
				2541	MVT PtrVT = Ptr.getValueType();
				2542	for (unsigned i = 0; i != NumValues; ++i) {
				2543	SDValue L = DAG.getLoad(ValueVTs[i], Root,
				2544	DAG.getNode(ISD::ADD, PtrVT, Ptr,
				2545	DAG.getConstant(Offsets[i], PtrVT)),
				2546	SV, Offsets[i],
				2547	isVolatile, Alignment);
				2548	Values[i] = L;
				2549	Chains[i] = L.getValue(1);
				2550	}
				2551
				2552	if (!ConstantMemory) {
				2553	SDValue Chain = DAG.getNode(ISD::TokenFactor, MVT::Other,
				2554	&Chains[0], NumValues);
				2555	if (isVolatile)
				2556	DAG.setRoot(Chain);
				2557	else
				2558	PendingLoads.push_back(Chain);
				2559	}
				2560
				2561	setValue(&I, DAG.getMergeValues(DAG.getVTList(&ValueVTs[0], NumValues),
				2562	&Values[0], NumValues));
				2563	}
				2564
				2565
				2566	void SelectionDAGLowering::visitStore(StoreInst &I) {
				2567	Value *SrcV = I.getOperand(0);
				2568	Value *PtrV = I.getOperand(1);
				2569
				2570	SmallVector<MVT, 4> ValueVTs;
				2571	SmallVector<uint64_t, 4> Offsets;
				2572	ComputeValueVTs(TLI, SrcV->getType(), ValueVTs, &Offsets);
				2573	unsigned NumValues = ValueVTs.size();
				2574	if (NumValues == 0)
				2575	return;
				2576
				2577	// Get the lowered operands. Note that we do this after
				2578	// checking if NumResults is zero, because with zero results
				2579	// the operands won't have values in the map.
				2580	SDValue Src = getValue(SrcV);
				2581	SDValue Ptr = getValue(PtrV);
				2582
				2583	SDValue Root = getRoot();
				2584	SmallVector<SDValue, 4> Chains(NumValues);
				2585	MVT PtrVT = Ptr.getValueType();
				2586	bool isVolatile = I.isVolatile();
				2587	unsigned Alignment = I.getAlignment();
				2588	for (unsigned i = 0; i != NumValues; ++i)
				2589	Chains[i] = DAG.getStore(Root, SDValue(Src.getNode(), Src.getResNo() + i),
				2590	DAG.getNode(ISD::ADD, PtrVT, Ptr,
				2591	DAG.getConstant(Offsets[i], PtrVT)),
				2592	PtrV, Offsets[i],
				2593	isVolatile, Alignment);
				2594
				2595	DAG.setRoot(DAG.getNode(ISD::TokenFactor, MVT::Other, &Chains[0], NumValues));
				2596	}
				2597
				2598	/// visitTargetIntrinsic - Lower a call of a target intrinsic to an INTRINSIC
				2599	/// node.
				2600	void SelectionDAGLowering::visitTargetIntrinsic(CallInst &I,
				2601	unsigned Intrinsic) {
				2602	bool HasChain = !I.doesNotAccessMemory();
				2603	bool OnlyLoad = HasChain && I.onlyReadsMemory();
				2604
				2605	// Build the operand list.
				2606	SmallVector<SDValue, 8> Ops;
				2607	if (HasChain) { // If this intrinsic has side-effects, chainify it.
				2608	if (OnlyLoad) {
				2609	// We don't need to serialize loads against other loads.
				2610	Ops.push_back(DAG.getRoot());
				2611	} else {
				2612	Ops.push_back(getRoot());
				2613	}
				2614	}
				2615
				2616	// Add the intrinsic ID as an integer operand.
				2617	Ops.push_back(DAG.getConstant(Intrinsic, TLI.getPointerTy()));
				2618
				2619	// Add all operands of the call to the operand list.
				2620	for (unsigned i = 1, e = I.getNumOperands(); i != e; ++i) {
				2621	SDValue Op = getValue(I.getOperand(i));
				2622	assert(TLI.isTypeLegal(Op.getValueType()) &&
				2623	"Intrinsic uses a non-legal type?");
				2624	Ops.push_back(Op);
				2625	}
				2626
				2627	std::vector<MVT> VTs;
				2628	if (I.getType() != Type::VoidTy) {
				2629	MVT VT = TLI.getValueType(I.getType());
				2630	if (VT.isVector()) {
				2631	const VectorType *DestTy = cast<VectorType>(I.getType());
				2632	MVT EltVT = TLI.getValueType(DestTy->getElementType());
				2633
				2634	VT = MVT::getVectorVT(EltVT, DestTy->getNumElements());
				2635	assert(VT != MVT::Other && "Intrinsic uses a non-legal type?");
				2636	}
				2637
				2638	assert(TLI.isTypeLegal(VT) && "Intrinsic uses a non-legal type?");
				2639	VTs.push_back(VT);
				2640	}
				2641	if (HasChain)
				2642	VTs.push_back(MVT::Other);
				2643
				2644	const MVT *VTList = DAG.getNodeValueTypes(VTs);
				2645
				2646	// Create the node.
				2647	SDValue Result;
				2648	if (!HasChain)
				2649	Result = DAG.getNode(ISD::INTRINSIC_WO_CHAIN, VTList, VTs.size(),
				2650	&Ops[0], Ops.size());
				2651	else if (I.getType() != Type::VoidTy)
				2652	Result = DAG.getNode(ISD::INTRINSIC_W_CHAIN, VTList, VTs.size(),
				2653	&Ops[0], Ops.size());
				2654	else
				2655	Result = DAG.getNode(ISD::INTRINSIC_VOID, VTList, VTs.size(),
				2656	&Ops[0], Ops.size());
				2657
				2658	if (HasChain) {
				2659	SDValue Chain = Result.getValue(Result.getNode()->getNumValues()-1);
				2660	if (OnlyLoad)
				2661	PendingLoads.push_back(Chain);
				2662	else
				2663	DAG.setRoot(Chain);
				2664	}
				2665	if (I.getType() != Type::VoidTy) {
				2666	if (const VectorType *PTy = dyn_cast<VectorType>(I.getType())) {
				2667	MVT VT = TLI.getValueType(PTy);
				2668	Result = DAG.getNode(ISD::BIT_CONVERT, VT, Result);
				2669	}
				2670	setValue(&I, Result);
				2671	}
				2672	}
				2673
				2674	/// ExtractTypeInfo - Returns the type info, possibly bitcast, encoded in V.
				2675	static GlobalVariable ExtractTypeInfo(Value V) {
				2676	V = V->stripPointerCasts();
				2677	GlobalVariable *GV = dyn_cast<GlobalVariable>(V);
				2678	assert ((GV \|\| isa<ConstantPointerNull>(V)) &&
				2679	"TypeInfo must be a global variable or NULL");
				2680	return GV;
				2681	}
				2682
				2683	namespace llvm {
				2684
				2685	/// AddCatchInfo - Extract the personality and type infos from an eh.selector
				2686	/// call, and add them to the specified machine basic block.
				2687	void AddCatchInfo(CallInst &I, MachineModuleInfo *MMI,
				2688	MachineBasicBlock *MBB) {
				2689	// Inform the MachineModuleInfo of the personality for this landing pad.
				2690	ConstantExpr *CE = cast<ConstantExpr>(I.getOperand(2));
				2691	assert(CE->getOpcode() == Instruction::BitCast &&
				2692	isa<Function>(CE->getOperand(0)) &&
				2693	"Personality should be a function");
				2694	MMI->addPersonality(MBB, cast<Function>(CE->getOperand(0)));
				2695
				2696	// Gather all the type infos for this landing pad and pass them along to
				2697	// MachineModuleInfo.
				2698	std::vector<GlobalVariable *> TyInfo;
				2699	unsigned N = I.getNumOperands();
				2700
				2701	for (unsigned i = N - 1; i > 2; --i) {
				2702	if (ConstantInt *CI = dyn_cast<ConstantInt>(I.getOperand(i))) {
				2703	unsigned FilterLength = CI->getZExtValue();
				2704	unsigned FirstCatch = i + FilterLength + !FilterLength;
				2705	assert (FirstCatch <= N && "Invalid filter length");
				2706
				2707	if (FirstCatch < N) {
				2708	TyInfo.reserve(N - FirstCatch);
				2709	for (unsigned j = FirstCatch; j < N; ++j)
				2710	TyInfo.push_back(ExtractTypeInfo(I.getOperand(j)));
				2711	MMI->addCatchTypeInfo(MBB, TyInfo);
				2712	TyInfo.clear();
				2713	}
				2714
				2715	if (!FilterLength) {
				2716	// Cleanup.
				2717	MMI->addCleanup(MBB);
				2718	} else {
				2719	// Filter.
				2720	TyInfo.reserve(FilterLength - 1);
				2721	for (unsigned j = i + 1; j < FirstCatch; ++j)
				2722	TyInfo.push_back(ExtractTypeInfo(I.getOperand(j)));
				2723	MMI->addFilterTypeInfo(MBB, TyInfo);
				2724	TyInfo.clear();
				2725	}
				2726
				2727	N = i;
				2728	}
				2729	}
				2730
				2731	if (N > 3) {
				2732	TyInfo.reserve(N - 3);
				2733	for (unsigned j = 3; j < N; ++j)
				2734	TyInfo.push_back(ExtractTypeInfo(I.getOperand(j)));
				2735	MMI->addCatchTypeInfo(MBB, TyInfo);
				2736	}
				2737	}
				2738
				2739	}
				2740
				2741	/// Inlined utility function to implement binary input atomic intrinsics for
				2742	/// visitIntrinsicCall: I is a call instruction
				2743	/// Op is the associated NodeType for I
				2744	const char *
				2745	SelectionDAGLowering::implVisitBinaryAtomic(CallInst& I, ISD::NodeType Op) {
				2746	SDValue Root = getRoot();
				2747	SDValue L = DAG.getAtomic(Op, Root,
				2748	getValue(I.getOperand(1)),
				2749	getValue(I.getOperand(2)),
				2750	I.getOperand(1));
				2751	setValue(&I, L);
				2752	DAG.setRoot(L.getValue(1));
				2753	return 0;
				2754	}
				2755
Dale Johannesen	59e577f	2008-09-05 18:38:42 +0000	[diff] [blame^]	2756	/// visitExp - lower an exp intrinsic. Handles the special sequences
				2757	/// for limited-precision mode.
				2758
				2759	void
				2760	SelectionDAGLowering::visitExp(CallInst &I) {
				2761	SDValue result;
				2762	// No special expansion.
				2763	result = DAG.getNode(ISD::FEXP,
				2764	getValue(I.getOperand(1)).getValueType(),
				2765	getValue(I.getOperand(1)));
				2766	setValue(&I, result);
				2767	}
				2768
				2769	/// visitLog - lower a log intrinsic. Handles the special sequences
				2770	/// for limited-precision mode.
				2771
				2772	void
				2773	SelectionDAGLowering::visitLog(CallInst &I) {
				2774	SDValue result;
				2775	// No special expansion.
				2776	result = DAG.getNode(ISD::FLOG,
				2777	getValue(I.getOperand(1)).getValueType(),
				2778	getValue(I.getOperand(1)));
				2779	setValue(&I, result);
				2780	}
				2781
				2782	/// visitLog2 - lower a log2 intrinsic. Handles the special sequences
				2783	/// for limited-precision mode.
				2784
				2785	void
				2786	SelectionDAGLowering::visitLog2(CallInst &I) {
				2787	SDValue result;
				2788	// No special expansion.
				2789	result = DAG.getNode(ISD::FLOG2,
				2790	getValue(I.getOperand(1)).getValueType(),
				2791	getValue(I.getOperand(1)));
				2792	setValue(&I, result);
				2793	}
				2794
				2795	/// visitLog10 - lower a log10 intrinsic. Handles the special sequences
				2796	/// for limited-precision mode.
				2797
				2798	void
				2799	SelectionDAGLowering::visitLog10(CallInst &I) {
				2800	SDValue result;
				2801	// No special expansion.
				2802	result = DAG.getNode(ISD::FLOG10,
				2803	getValue(I.getOperand(1)).getValueType(),
				2804	getValue(I.getOperand(1)));
				2805	setValue(&I, result);
				2806	}
				2807
Dale Johannesen	601d3c0	2008-09-05 01:48:15 +0000	[diff] [blame]	2808	/// visitExp2 - lower an exp2 intrinsic. Handles the special sequences
				2809	/// for limited-precision mode.
				2810
				2811	void
				2812	SelectionDAGLowering::visitExp2(CallInst &I) {
				2813	SDValue result;
				2814	if (getValue(I.getOperand(1)).getValueType() == MVT::f32 &&
				2815	LimitFloatPrecision>0 && LimitFloatPrecision<=12) {
				2816	SDValue operand = getValue(I.getOperand(1));
				2817	SDValue t0 = DAG.getNode(ISD::FP_TO_SINT, MVT::i32, operand);
				2818	SDValue t1 = DAG.getNode(ISD::SINT_TO_FP, MVT::f32, t0);
				2819	SDValue t2 = DAG.getNode(ISD::FSUB, MVT::f32, operand, t1);
				2820	SDValue t3 = DAG.getNode(ISD::SHL, MVT::i32, t0,
				2821	DAG.getConstant(23, MVT::i32));
				2822	SDValue t4 = DAG.getNode(ISD::FP_EXTEND, MVT::f64, t2);
				2823	SDValue t5 = DAG.getNode(ISD::FMUL, MVT::f64, t4,
				2824	DAG.getConstantFP(APFloat(
				2825	APInt(64, 0x3fb446bc609aa9cdULL)), MVT::f64));
				2826	SDValue t6 = DAG.getNode(ISD::FADD, MVT::f64, t5,
				2827	DAG.getConstantFP(APFloat(
				2828	APInt(64, 0x3fccb71e629f3a20ULL)), MVT::f64));
				2829	SDValue t7 = DAG.getNode(ISD::FMUL, MVT::f64, t6, t4);
				2830	SDValue t8 = DAG.getNode(ISD::FADD, MVT::f64, t7,
				2831	DAG.getConstantFP(APFloat(
				2832	APInt(64, 0x3fe64960db7bd5feULL)), MVT::f64));
				2833	SDValue t9 = DAG.getNode(ISD::FMUL, MVT::f64, t8, t4);
				2834	SDValue t10 = DAG.getNode(ISD::FADD, MVT::f64, t9,
				2835	DAG.getConstantFP(APFloat(
				2836	APInt(64, 0x3fefff1f934bd549ULL)), MVT::f64));
				2837	SDValue t11 = DAG.getNode(ISD::FP_ROUND, MVT::f32, t10,
				2838	DAG.getConstant(0, MVT::i32));
				2839	SDValue t12 = DAG.getNode(ISD::BIT_CONVERT, MVT::i32, t11);
				2840	SDValue t13 = DAG.getNode(ISD::ADD, MVT::i32, t12, t3);
				2841	result = DAG.getNode(ISD::BIT_CONVERT, MVT::f32, t13);
				2842	} else {
				2843	// No special expansion.
				2844	result = DAG.getNode(ISD::FEXP2,
				2845	getValue(I.getOperand(1)).getValueType(),
				2846	getValue(I.getOperand(1)));
				2847	}
				2848	setValue(&I, result);
				2849	}
				2850
Dan Gohman	f0cbcd4	2008-09-03 16:12:24 +0000	[diff] [blame]	2851	/// visitIntrinsicCall - Lower the call to the specified intrinsic function. If
				2852	/// we want to emit this as a call to a named external function, return the name
				2853	/// otherwise lower it and return null.
				2854	const char *
				2855	SelectionDAGLowering::visitIntrinsicCall(CallInst &I, unsigned Intrinsic) {
				2856	switch (Intrinsic) {
				2857	default:
				2858	// By default, turn this into a target intrinsic node.
				2859	visitTargetIntrinsic(I, Intrinsic);
				2860	return 0;
				2861	case Intrinsic::vastart: visitVAStart(I); return 0;
				2862	case Intrinsic::vaend: visitVAEnd(I); return 0;
				2863	case Intrinsic::vacopy: visitVACopy(I); return 0;
				2864	case Intrinsic::returnaddress:
				2865	setValue(&I, DAG.getNode(ISD::RETURNADDR, TLI.getPointerTy(),
				2866	getValue(I.getOperand(1))));
				2867	return 0;
				2868	case Intrinsic::frameaddress:
				2869	setValue(&I, DAG.getNode(ISD::FRAMEADDR, TLI.getPointerTy(),
				2870	getValue(I.getOperand(1))));
				2871	return 0;
				2872	case Intrinsic::setjmp:
				2873	return "_setjmp"+!TLI.usesUnderscoreSetJmp();
				2874	break;
				2875	case Intrinsic::longjmp:
				2876	return "_longjmp"+!TLI.usesUnderscoreLongJmp();
				2877	break;
				2878	case Intrinsic::memcpy_i32:
				2879	case Intrinsic::memcpy_i64: {
				2880	SDValue Op1 = getValue(I.getOperand(1));
				2881	SDValue Op2 = getValue(I.getOperand(2));
				2882	SDValue Op3 = getValue(I.getOperand(3));
				2883	unsigned Align = cast<ConstantInt>(I.getOperand(4))->getZExtValue();
				2884	DAG.setRoot(DAG.getMemcpy(getRoot(), Op1, Op2, Op3, Align, false,
				2885	I.getOperand(1), 0, I.getOperand(2), 0));
				2886	return 0;
				2887	}
				2888	case Intrinsic::memset_i32:
				2889	case Intrinsic::memset_i64: {
				2890	SDValue Op1 = getValue(I.getOperand(1));
				2891	SDValue Op2 = getValue(I.getOperand(2));
				2892	SDValue Op3 = getValue(I.getOperand(3));
				2893	unsigned Align = cast<ConstantInt>(I.getOperand(4))->getZExtValue();
				2894	DAG.setRoot(DAG.getMemset(getRoot(), Op1, Op2, Op3, Align,
				2895	I.getOperand(1), 0));
				2896	return 0;
				2897	}
				2898	case Intrinsic::memmove_i32:
				2899	case Intrinsic::memmove_i64: {
				2900	SDValue Op1 = getValue(I.getOperand(1));
				2901	SDValue Op2 = getValue(I.getOperand(2));
				2902	SDValue Op3 = getValue(I.getOperand(3));
				2903	unsigned Align = cast<ConstantInt>(I.getOperand(4))->getZExtValue();
				2904
				2905	// If the source and destination are known to not be aliases, we can
				2906	// lower memmove as memcpy.
				2907	uint64_t Size = -1ULL;
				2908	if (ConstantSDNode *C = dyn_cast<ConstantSDNode>(Op3))
				2909	Size = C->getValue();
				2910	if (AA->alias(I.getOperand(1), Size, I.getOperand(2), Size) ==
				2911	AliasAnalysis::NoAlias) {
				2912	DAG.setRoot(DAG.getMemcpy(getRoot(), Op1, Op2, Op3, Align, false,
				2913	I.getOperand(1), 0, I.getOperand(2), 0));
				2914	return 0;
				2915	}
				2916
				2917	DAG.setRoot(DAG.getMemmove(getRoot(), Op1, Op2, Op3, Align,
				2918	I.getOperand(1), 0, I.getOperand(2), 0));
				2919	return 0;
				2920	}
				2921	case Intrinsic::dbg_stoppoint: {
				2922	MachineModuleInfo *MMI = DAG.getMachineModuleInfo();
				2923	DbgStopPointInst &SPI = cast<DbgStopPointInst>(I);
				2924	if (MMI && SPI.getContext() && MMI->Verify(SPI.getContext())) {
				2925	DebugInfoDesc *DD = MMI->getDescFor(SPI.getContext());
				2926	assert(DD && "Not a debug information descriptor");
				2927	DAG.setRoot(DAG.getDbgStopPoint(getRoot(),
				2928	SPI.getLine(),
				2929	SPI.getColumn(),
				2930	cast<CompileUnitDesc>(DD)));
				2931	}
				2932
				2933	return 0;
				2934	}
				2935	case Intrinsic::dbg_region_start: {
				2936	MachineModuleInfo *MMI = DAG.getMachineModuleInfo();
				2937	DbgRegionStartInst &RSI = cast<DbgRegionStartInst>(I);
				2938	if (MMI && RSI.getContext() && MMI->Verify(RSI.getContext())) {
				2939	unsigned LabelID = MMI->RecordRegionStart(RSI.getContext());
				2940	DAG.setRoot(DAG.getLabel(ISD::DBG_LABEL, getRoot(), LabelID));
				2941	}
				2942
				2943	return 0;
				2944	}
				2945	case Intrinsic::dbg_region_end: {
				2946	MachineModuleInfo *MMI = DAG.getMachineModuleInfo();
				2947	DbgRegionEndInst &REI = cast<DbgRegionEndInst>(I);
				2948	if (MMI && REI.getContext() && MMI->Verify(REI.getContext())) {
				2949	unsigned LabelID = MMI->RecordRegionEnd(REI.getContext());
				2950	DAG.setRoot(DAG.getLabel(ISD::DBG_LABEL, getRoot(), LabelID));
				2951	}
				2952
				2953	return 0;
				2954	}
				2955	case Intrinsic::dbg_func_start: {
				2956	MachineModuleInfo *MMI = DAG.getMachineModuleInfo();
				2957	if (!MMI) return 0;
				2958	DbgFuncStartInst &FSI = cast<DbgFuncStartInst>(I);
				2959	Value *SP = FSI.getSubprogram();
				2960	if (SP && MMI->Verify(SP)) {
				2961	// llvm.dbg.func.start implicitly defines a dbg_stoppoint which is
				2962	// what (most?) gdb expects.
				2963	DebugInfoDesc *DD = MMI->getDescFor(SP);
				2964	assert(DD && "Not a debug information descriptor");
				2965	SubprogramDesc *Subprogram = cast<SubprogramDesc>(DD);
				2966	const CompileUnitDesc *CompileUnit = Subprogram->getFile();
				2967	unsigned SrcFile = MMI->RecordSource(CompileUnit);
				2968	// Record the source line but does create a label. It will be emitted
				2969	// at asm emission time.
				2970	MMI->RecordSourceLine(Subprogram->getLine(), 0, SrcFile);
				2971	}
				2972
				2973	return 0;
				2974	}
				2975	case Intrinsic::dbg_declare: {
				2976	MachineModuleInfo *MMI = DAG.getMachineModuleInfo();
				2977	DbgDeclareInst &DI = cast<DbgDeclareInst>(I);
				2978	Value *Variable = DI.getVariable();
				2979	if (MMI && Variable && MMI->Verify(Variable))
				2980	DAG.setRoot(DAG.getNode(ISD::DECLARE, MVT::Other, getRoot(),
				2981	getValue(DI.getAddress()), getValue(Variable)));
				2982	return 0;
				2983	}
				2984
				2985	case Intrinsic::eh_exception: {
				2986	if (!CurMBB->isLandingPad()) {
				2987	// FIXME: Mark exception register as live in. Hack for PR1508.
				2988	unsigned Reg = TLI.getExceptionAddressRegister();
				2989	if (Reg) CurMBB->addLiveIn(Reg);
				2990	}
				2991	// Insert the EXCEPTIONADDR instruction.
				2992	SDVTList VTs = DAG.getVTList(TLI.getPointerTy(), MVT::Other);
				2993	SDValue Ops[1];
				2994	Ops[0] = DAG.getRoot();
				2995	SDValue Op = DAG.getNode(ISD::EXCEPTIONADDR, VTs, Ops, 1);
				2996	setValue(&I, Op);
				2997	DAG.setRoot(Op.getValue(1));
				2998	return 0;
				2999	}
				3000
				3001	case Intrinsic::eh_selector_i32:
				3002	case Intrinsic::eh_selector_i64: {
				3003	MachineModuleInfo *MMI = DAG.getMachineModuleInfo();
				3004	MVT VT = (Intrinsic == Intrinsic::eh_selector_i32 ?
				3005	MVT::i32 : MVT::i64);
				3006
				3007	if (MMI) {
				3008	if (CurMBB->isLandingPad())
				3009	AddCatchInfo(I, MMI, CurMBB);
				3010	else {
				3011	#ifndef NDEBUG
				3012	FuncInfo.CatchInfoLost.insert(&I);
				3013	#endif
				3014	// FIXME: Mark exception selector register as live in. Hack for PR1508.
				3015	unsigned Reg = TLI.getExceptionSelectorRegister();
				3016	if (Reg) CurMBB->addLiveIn(Reg);
				3017	}
				3018
				3019	// Insert the EHSELECTION instruction.
				3020	SDVTList VTs = DAG.getVTList(VT, MVT::Other);
				3021	SDValue Ops[2];
				3022	Ops[0] = getValue(I.getOperand(1));
				3023	Ops[1] = getRoot();
				3024	SDValue Op = DAG.getNode(ISD::EHSELECTION, VTs, Ops, 2);
				3025	setValue(&I, Op);
				3026	DAG.setRoot(Op.getValue(1));
				3027	} else {
				3028	setValue(&I, DAG.getConstant(0, VT));
				3029	}
				3030
				3031	return 0;
				3032	}
				3033
				3034	case Intrinsic::eh_typeid_for_i32:
				3035	case Intrinsic::eh_typeid_for_i64: {
				3036	MachineModuleInfo *MMI = DAG.getMachineModuleInfo();
				3037	MVT VT = (Intrinsic == Intrinsic::eh_typeid_for_i32 ?
				3038	MVT::i32 : MVT::i64);
				3039
				3040	if (MMI) {
				3041	// Find the type id for the given typeinfo.
				3042	GlobalVariable *GV = ExtractTypeInfo(I.getOperand(1));
				3043
				3044	unsigned TypeID = MMI->getTypeIDFor(GV);
				3045	setValue(&I, DAG.getConstant(TypeID, VT));
				3046	} else {
				3047	// Return something different to eh_selector.
				3048	setValue(&I, DAG.getConstant(1, VT));
				3049	}
				3050
				3051	return 0;
				3052	}
				3053
				3054	case Intrinsic::eh_return: {
				3055	MachineModuleInfo *MMI = DAG.getMachineModuleInfo();
				3056
				3057	if (MMI) {
				3058	MMI->setCallsEHReturn(true);
				3059	DAG.setRoot(DAG.getNode(ISD::EH_RETURN,
				3060	MVT::Other,
				3061	getControlRoot(),
				3062	getValue(I.getOperand(1)),
				3063	getValue(I.getOperand(2))));
				3064	} else {
				3065	setValue(&I, DAG.getConstant(0, TLI.getPointerTy()));
				3066	}
				3067
				3068	return 0;
				3069	}
				3070
				3071	case Intrinsic::eh_unwind_init: {
				3072	if (MachineModuleInfo *MMI = DAG.getMachineModuleInfo()) {
				3073	MMI->setCallsUnwindInit(true);
				3074	}
				3075
				3076	return 0;
				3077	}
				3078
				3079	case Intrinsic::eh_dwarf_cfa: {
				3080	MVT VT = getValue(I.getOperand(1)).getValueType();
				3081	SDValue CfaArg;
				3082	if (VT.bitsGT(TLI.getPointerTy()))
				3083	CfaArg = DAG.getNode(ISD::TRUNCATE,
				3084	TLI.getPointerTy(), getValue(I.getOperand(1)));
				3085	else
				3086	CfaArg = DAG.getNode(ISD::SIGN_EXTEND,
				3087	TLI.getPointerTy(), getValue(I.getOperand(1)));
				3088
				3089	SDValue Offset = DAG.getNode(ISD::ADD,
				3090	TLI.getPointerTy(),
				3091	DAG.getNode(ISD::FRAME_TO_ARGS_OFFSET,
				3092	TLI.getPointerTy()),
				3093	CfaArg);
				3094	setValue(&I, DAG.getNode(ISD::ADD,
				3095	TLI.getPointerTy(),
				3096	DAG.getNode(ISD::FRAMEADDR,
				3097	TLI.getPointerTy(),
				3098	DAG.getConstant(0,
				3099	TLI.getPointerTy())),
				3100	Offset));
				3101	return 0;
				3102	}
				3103
				3104	case Intrinsic::sqrt:
				3105	setValue(&I, DAG.getNode(ISD::FSQRT,
				3106	getValue(I.getOperand(1)).getValueType(),
				3107	getValue(I.getOperand(1))));
				3108	return 0;
				3109	case Intrinsic::powi:
				3110	setValue(&I, DAG.getNode(ISD::FPOWI,
				3111	getValue(I.getOperand(1)).getValueType(),
				3112	getValue(I.getOperand(1)),
				3113	getValue(I.getOperand(2))));
				3114	return 0;
				3115	case Intrinsic::sin:
				3116	setValue(&I, DAG.getNode(ISD::FSIN,
				3117	getValue(I.getOperand(1)).getValueType(),
				3118	getValue(I.getOperand(1))));
				3119	return 0;
				3120	case Intrinsic::cos:
				3121	setValue(&I, DAG.getNode(ISD::FCOS,
				3122	getValue(I.getOperand(1)).getValueType(),
				3123	getValue(I.getOperand(1))));
				3124	return 0;
Dale Johannesen	7794f2a	2008-09-04 00:47:13 +0000	[diff] [blame]	3125	case Intrinsic::log:
Dale Johannesen	59e577f	2008-09-05 18:38:42 +0000	[diff] [blame^]	3126	visitLog(I);
Dale Johannesen	7794f2a	2008-09-04 00:47:13 +0000	[diff] [blame]	3127	return 0;
				3128	case Intrinsic::log2:
Dale Johannesen	59e577f	2008-09-05 18:38:42 +0000	[diff] [blame^]	3129	visitLog2(I);
Dale Johannesen	7794f2a	2008-09-04 00:47:13 +0000	[diff] [blame]	3130	return 0;
				3131	case Intrinsic::log10:
Dale Johannesen	59e577f	2008-09-05 18:38:42 +0000	[diff] [blame^]	3132	visitLog10(I);
Dale Johannesen	7794f2a	2008-09-04 00:47:13 +0000	[diff] [blame]	3133	return 0;
				3134	case Intrinsic::exp:
Dale Johannesen	59e577f	2008-09-05 18:38:42 +0000	[diff] [blame^]	3135	visitExp(I);
Dale Johannesen	7794f2a	2008-09-04 00:47:13 +0000	[diff] [blame]	3136	return 0;
				3137	case Intrinsic::exp2:
Dale Johannesen	601d3c0	2008-09-05 01:48:15 +0000	[diff] [blame]	3138	visitExp2(I);
Dale Johannesen	7794f2a	2008-09-04 00:47:13 +0000	[diff] [blame]	3139	return 0;
Dan Gohman	f0cbcd4	2008-09-03 16:12:24 +0000	[diff] [blame]	3140	case Intrinsic::pow:
				3141	setValue(&I, DAG.getNode(ISD::FPOW,
				3142	getValue(I.getOperand(1)).getValueType(),
				3143	getValue(I.getOperand(1)),
				3144	getValue(I.getOperand(2))));
				3145	return 0;
				3146	case Intrinsic::pcmarker: {
				3147	SDValue Tmp = getValue(I.getOperand(1));
				3148	DAG.setRoot(DAG.getNode(ISD::PCMARKER, MVT::Other, getRoot(), Tmp));
				3149	return 0;
				3150	}
				3151	case Intrinsic::readcyclecounter: {
				3152	SDValue Op = getRoot();
				3153	SDValue Tmp = DAG.getNode(ISD::READCYCLECOUNTER,
				3154	DAG.getNodeValueTypes(MVT::i64, MVT::Other), 2,
				3155	&Op, 1);
				3156	setValue(&I, Tmp);
				3157	DAG.setRoot(Tmp.getValue(1));
				3158	return 0;
				3159	}
				3160	case Intrinsic::part_select: {
				3161	// Currently not implemented: just abort
				3162	assert(0 && "part_select intrinsic not implemented");
				3163	abort();
				3164	}
				3165	case Intrinsic::part_set: {
				3166	// Currently not implemented: just abort
				3167	assert(0 && "part_set intrinsic not implemented");
				3168	abort();
				3169	}
				3170	case Intrinsic::bswap:
				3171	setValue(&I, DAG.getNode(ISD::BSWAP,
				3172	getValue(I.getOperand(1)).getValueType(),
				3173	getValue(I.getOperand(1))));
				3174	return 0;
				3175	case Intrinsic::cttz: {
				3176	SDValue Arg = getValue(I.getOperand(1));
				3177	MVT Ty = Arg.getValueType();
				3178	SDValue result = DAG.getNode(ISD::CTTZ, Ty, Arg);
				3179	setValue(&I, result);
				3180	return 0;
				3181	}
				3182	case Intrinsic::ctlz: {
				3183	SDValue Arg = getValue(I.getOperand(1));
				3184	MVT Ty = Arg.getValueType();
				3185	SDValue result = DAG.getNode(ISD::CTLZ, Ty, Arg);
				3186	setValue(&I, result);
				3187	return 0;
				3188	}
				3189	case Intrinsic::ctpop: {
				3190	SDValue Arg = getValue(I.getOperand(1));
				3191	MVT Ty = Arg.getValueType();
				3192	SDValue result = DAG.getNode(ISD::CTPOP, Ty, Arg);
				3193	setValue(&I, result);
				3194	return 0;
				3195	}
				3196	case Intrinsic::stacksave: {
				3197	SDValue Op = getRoot();
				3198	SDValue Tmp = DAG.getNode(ISD::STACKSAVE,
				3199	DAG.getNodeValueTypes(TLI.getPointerTy(), MVT::Other), 2, &Op, 1);
				3200	setValue(&I, Tmp);
				3201	DAG.setRoot(Tmp.getValue(1));
				3202	return 0;
				3203	}
				3204	case Intrinsic::stackrestore: {
				3205	SDValue Tmp = getValue(I.getOperand(1));
				3206	DAG.setRoot(DAG.getNode(ISD::STACKRESTORE, MVT::Other, getRoot(), Tmp));
				3207	return 0;
				3208	}
				3209	case Intrinsic::var_annotation:
				3210	// Discard annotate attributes
				3211	return 0;
				3212
				3213	case Intrinsic::init_trampoline: {
				3214	const Function *F = cast<Function>(I.getOperand(2)->stripPointerCasts());
				3215
				3216	SDValue Ops[6];
				3217	Ops[0] = getRoot();
				3218	Ops[1] = getValue(I.getOperand(1));
				3219	Ops[2] = getValue(I.getOperand(2));
				3220	Ops[3] = getValue(I.getOperand(3));
				3221	Ops[4] = DAG.getSrcValue(I.getOperand(1));
				3222	Ops[5] = DAG.getSrcValue(F);
				3223
				3224	SDValue Tmp = DAG.getNode(ISD::TRAMPOLINE,
				3225	DAG.getNodeValueTypes(TLI.getPointerTy(),
				3226	MVT::Other), 2,
				3227	Ops, 6);
				3228
				3229	setValue(&I, Tmp);
				3230	DAG.setRoot(Tmp.getValue(1));
				3231	return 0;
				3232	}
				3233
				3234	case Intrinsic::gcroot:
				3235	if (GFI) {
				3236	Value *Alloca = I.getOperand(1);
				3237	Constant *TypeMap = cast<Constant>(I.getOperand(2));
				3238
				3239	FrameIndexSDNode *FI = cast<FrameIndexSDNode>(getValue(Alloca).getNode());
				3240	GFI->addStackRoot(FI->getIndex(), TypeMap);
				3241	}
				3242	return 0;
				3243
				3244	case Intrinsic::gcread:
				3245	case Intrinsic::gcwrite:
				3246	assert(0 && "GC failed to lower gcread/gcwrite intrinsics!");
				3247	return 0;
				3248
				3249	case Intrinsic::flt_rounds: {
				3250	setValue(&I, DAG.getNode(ISD::FLT_ROUNDS_, MVT::i32));
				3251	return 0;
				3252	}
				3253
				3254	case Intrinsic::trap: {
				3255	DAG.setRoot(DAG.getNode(ISD::TRAP, MVT::Other, getRoot()));
				3256	return 0;
				3257	}
				3258	case Intrinsic::prefetch: {
				3259	SDValue Ops[4];
				3260	Ops[0] = getRoot();
				3261	Ops[1] = getValue(I.getOperand(1));
				3262	Ops[2] = getValue(I.getOperand(2));
				3263	Ops[3] = getValue(I.getOperand(3));
				3264	DAG.setRoot(DAG.getNode(ISD::PREFETCH, MVT::Other, &Ops[0], 4));
				3265	return 0;
				3266	}
				3267
				3268	case Intrinsic::memory_barrier: {
				3269	SDValue Ops[6];
				3270	Ops[0] = getRoot();
				3271	for (int x = 1; x < 6; ++x)
				3272	Ops[x] = getValue(I.getOperand(x));
				3273
				3274	DAG.setRoot(DAG.getNode(ISD::MEMBARRIER, MVT::Other, &Ops[0], 6));
				3275	return 0;
				3276	}
				3277	case Intrinsic::atomic_cmp_swap: {
				3278	SDValue Root = getRoot();
				3279	SDValue L;
				3280	switch (getValue(I.getOperand(2)).getValueType().getSimpleVT()) {
				3281	case MVT::i8:
				3282	L = DAG.getAtomic(ISD::ATOMIC_CMP_SWAP_8, Root,
				3283	getValue(I.getOperand(1)),
				3284	getValue(I.getOperand(2)),
				3285	getValue(I.getOperand(3)),
				3286	I.getOperand(1));
				3287	break;
				3288	case MVT::i16:
				3289	L = DAG.getAtomic(ISD::ATOMIC_CMP_SWAP_16, Root,
				3290	getValue(I.getOperand(1)),
				3291	getValue(I.getOperand(2)),
				3292	getValue(I.getOperand(3)),
				3293	I.getOperand(1));
				3294	break;
				3295	case MVT::i32:
				3296	L = DAG.getAtomic(ISD::ATOMIC_CMP_SWAP_32, Root,
				3297	getValue(I.getOperand(1)),
				3298	getValue(I.getOperand(2)),
				3299	getValue(I.getOperand(3)),
				3300	I.getOperand(1));
				3301	break;
				3302	case MVT::i64:
				3303	L = DAG.getAtomic(ISD::ATOMIC_CMP_SWAP_64, Root,
				3304	getValue(I.getOperand(1)),
				3305	getValue(I.getOperand(2)),
				3306	getValue(I.getOperand(3)),
				3307	I.getOperand(1));
				3308	break;
				3309	default:
				3310	assert(0 && "Invalid atomic type");
				3311	abort();
				3312	}
				3313	setValue(&I, L);
				3314	DAG.setRoot(L.getValue(1));
				3315	return 0;
				3316	}
				3317	case Intrinsic::atomic_load_add:
				3318	switch (getValue(I.getOperand(2)).getValueType().getSimpleVT()) {
				3319	case MVT::i8:
				3320	return implVisitBinaryAtomic(I, ISD::ATOMIC_LOAD_ADD_8);
				3321	case MVT::i16:
				3322	return implVisitBinaryAtomic(I, ISD::ATOMIC_LOAD_ADD_16);
				3323	case MVT::i32:
				3324	return implVisitBinaryAtomic(I, ISD::ATOMIC_LOAD_ADD_32);
				3325	case MVT::i64:
				3326	return implVisitBinaryAtomic(I, ISD::ATOMIC_LOAD_ADD_64);
				3327	default:
				3328	assert(0 && "Invalid atomic type");
				3329	abort();
				3330	}
				3331	case Intrinsic::atomic_load_sub:
				3332	switch (getValue(I.getOperand(2)).getValueType().getSimpleVT()) {
				3333	case MVT::i8:
				3334	return implVisitBinaryAtomic(I, ISD::ATOMIC_LOAD_SUB_8);
				3335	case MVT::i16:
				3336	return implVisitBinaryAtomic(I, ISD::ATOMIC_LOAD_SUB_16);
				3337	case MVT::i32:
				3338	return implVisitBinaryAtomic(I, ISD::ATOMIC_LOAD_SUB_32);
				3339	case MVT::i64:
				3340	return implVisitBinaryAtomic(I, ISD::ATOMIC_LOAD_SUB_64);
				3341	default:
				3342	assert(0 && "Invalid atomic type");
				3343	abort();
				3344	}
				3345	case Intrinsic::atomic_load_or:
				3346	switch (getValue(I.getOperand(2)).getValueType().getSimpleVT()) {
				3347	case MVT::i8:
				3348	return implVisitBinaryAtomic(I, ISD::ATOMIC_LOAD_OR_8);
				3349	case MVT::i16:
				3350	return implVisitBinaryAtomic(I, ISD::ATOMIC_LOAD_OR_16);
				3351	case MVT::i32:
				3352	return implVisitBinaryAtomic(I, ISD::ATOMIC_LOAD_OR_32);
				3353	case MVT::i64:
				3354	return implVisitBinaryAtomic(I, ISD::ATOMIC_LOAD_OR_64);
				3355	default:
				3356	assert(0 && "Invalid atomic type");
				3357	abort();
				3358	}
				3359	case Intrinsic::atomic_load_xor:
				3360	switch (getValue(I.getOperand(2)).getValueType().getSimpleVT()) {
				3361	case MVT::i8:
				3362	return implVisitBinaryAtomic(I, ISD::ATOMIC_LOAD_XOR_8);
				3363	case MVT::i16:
				3364	return implVisitBinaryAtomic(I, ISD::ATOMIC_LOAD_XOR_16);
				3365	case MVT::i32:
				3366	return implVisitBinaryAtomic(I, ISD::ATOMIC_LOAD_XOR_32);
				3367	case MVT::i64:
				3368	return implVisitBinaryAtomic(I, ISD::ATOMIC_LOAD_XOR_64);
				3369	default:
				3370	assert(0 && "Invalid atomic type");
				3371	abort();
				3372	}
				3373	case Intrinsic::atomic_load_and:
				3374	switch (getValue(I.getOperand(2)).getValueType().getSimpleVT()) {
				3375	case MVT::i8:
				3376	return implVisitBinaryAtomic(I, ISD::ATOMIC_LOAD_AND_8);
				3377	case MVT::i16:
				3378	return implVisitBinaryAtomic(I, ISD::ATOMIC_LOAD_AND_16);
				3379	case MVT::i32:
				3380	return implVisitBinaryAtomic(I, ISD::ATOMIC_LOAD_AND_32);
				3381	case MVT::i64:
				3382	return implVisitBinaryAtomic(I, ISD::ATOMIC_LOAD_AND_64);
				3383	default:
				3384	assert(0 && "Invalid atomic type");
				3385	abort();
				3386	}
				3387	case Intrinsic::atomic_load_nand:
				3388	switch (getValue(I.getOperand(2)).getValueType().getSimpleVT()) {
				3389	case MVT::i8:
				3390	return implVisitBinaryAtomic(I, ISD::ATOMIC_LOAD_NAND_8);
				3391	case MVT::i16:
				3392	return implVisitBinaryAtomic(I, ISD::ATOMIC_LOAD_NAND_16);
				3393	case MVT::i32:
				3394	return implVisitBinaryAtomic(I, ISD::ATOMIC_LOAD_NAND_32);
				3395	case MVT::i64:
				3396	return implVisitBinaryAtomic(I, ISD::ATOMIC_LOAD_NAND_64);
				3397	default:
				3398	assert(0 && "Invalid atomic type");
				3399	abort();
				3400	}
				3401	case Intrinsic::atomic_load_max:
				3402	switch (getValue(I.getOperand(2)).getValueType().getSimpleVT()) {
				3403	case MVT::i8:
				3404	return implVisitBinaryAtomic(I, ISD::ATOMIC_LOAD_MAX_8);
				3405	case MVT::i16:
				3406	return implVisitBinaryAtomic(I, ISD::ATOMIC_LOAD_MAX_16);
				3407	case MVT::i32:
				3408	return implVisitBinaryAtomic(I, ISD::ATOMIC_LOAD_MAX_32);
				3409	case MVT::i64:
				3410	return implVisitBinaryAtomic(I, ISD::ATOMIC_LOAD_MAX_64);
				3411	default:
				3412	assert(0 && "Invalid atomic type");
				3413	abort();
				3414	}
				3415	case Intrinsic::atomic_load_min:
				3416	switch (getValue(I.getOperand(2)).getValueType().getSimpleVT()) {
				3417	case MVT::i8:
				3418	return implVisitBinaryAtomic(I, ISD::ATOMIC_LOAD_MIN_8);
				3419	case MVT::i16:
				3420	return implVisitBinaryAtomic(I, ISD::ATOMIC_LOAD_MIN_16);
				3421	case MVT::i32:
				3422	return implVisitBinaryAtomic(I, ISD::ATOMIC_LOAD_MIN_32);
				3423	case MVT::i64:
				3424	return implVisitBinaryAtomic(I, ISD::ATOMIC_LOAD_MIN_64);
				3425	default:
				3426	assert(0 && "Invalid atomic type");
				3427	abort();
				3428	}
				3429	case Intrinsic::atomic_load_umin:
				3430	switch (getValue(I.getOperand(2)).getValueType().getSimpleVT()) {
				3431	case MVT::i8:
				3432	return implVisitBinaryAtomic(I, ISD::ATOMIC_LOAD_UMIN_8);
				3433	case MVT::i16:
				3434	return implVisitBinaryAtomic(I, ISD::ATOMIC_LOAD_UMIN_16);
				3435	case MVT::i32:
				3436	return implVisitBinaryAtomic(I, ISD::ATOMIC_LOAD_UMIN_32);
				3437	case MVT::i64:
				3438	return implVisitBinaryAtomic(I, ISD::ATOMIC_LOAD_UMIN_64);
				3439	default:
				3440	assert(0 && "Invalid atomic type");
				3441	abort();
				3442	}
				3443	case Intrinsic::atomic_load_umax:
				3444	switch (getValue(I.getOperand(2)).getValueType().getSimpleVT()) {
				3445	case MVT::i8:
				3446	return implVisitBinaryAtomic(I, ISD::ATOMIC_LOAD_UMAX_8);
				3447	case MVT::i16:
				3448	return implVisitBinaryAtomic(I, ISD::ATOMIC_LOAD_UMAX_16);
				3449	case MVT::i32:
				3450	return implVisitBinaryAtomic(I, ISD::ATOMIC_LOAD_UMAX_32);
				3451	case MVT::i64:
				3452	return implVisitBinaryAtomic(I, ISD::ATOMIC_LOAD_UMAX_64);
				3453	default:
				3454	assert(0 && "Invalid atomic type");
				3455	abort();
				3456	}
				3457	case Intrinsic::atomic_swap:
				3458	switch (getValue(I.getOperand(2)).getValueType().getSimpleVT()) {
				3459	case MVT::i8:
				3460	return implVisitBinaryAtomic(I, ISD::ATOMIC_SWAP_8);
				3461	case MVT::i16:
				3462	return implVisitBinaryAtomic(I, ISD::ATOMIC_SWAP_16);
				3463	case MVT::i32:
				3464	return implVisitBinaryAtomic(I, ISD::ATOMIC_SWAP_32);
				3465	case MVT::i64:
				3466	return implVisitBinaryAtomic(I, ISD::ATOMIC_SWAP_64);
				3467	default:
				3468	assert(0 && "Invalid atomic type");
				3469	abort();
				3470	}
				3471	}
				3472	}
				3473
				3474
				3475	void SelectionDAGLowering::LowerCallTo(CallSite CS, SDValue Callee,
				3476	bool IsTailCall,
				3477	MachineBasicBlock *LandingPad) {
				3478	const PointerType *PT = cast<PointerType>(CS.getCalledValue()->getType());
				3479	const FunctionType *FTy = cast<FunctionType>(PT->getElementType());
				3480	MachineModuleInfo *MMI = DAG.getMachineModuleInfo();
				3481	unsigned BeginLabel = 0, EndLabel = 0;
				3482
				3483	TargetLowering::ArgListTy Args;
				3484	TargetLowering::ArgListEntry Entry;
				3485	Args.reserve(CS.arg_size());
				3486	for (CallSite::arg_iterator i = CS.arg_begin(), e = CS.arg_end();
				3487	i != e; ++i) {
				3488	SDValue ArgNode = getValue(*i);
				3489	Entry.Node = ArgNode; Entry.Ty = (*i)->getType();
				3490
				3491	unsigned attrInd = i - CS.arg_begin() + 1;
				3492	Entry.isSExt = CS.paramHasAttr(attrInd, ParamAttr::SExt);
				3493	Entry.isZExt = CS.paramHasAttr(attrInd, ParamAttr::ZExt);
				3494	Entry.isInReg = CS.paramHasAttr(attrInd, ParamAttr::InReg);
				3495	Entry.isSRet = CS.paramHasAttr(attrInd, ParamAttr::StructRet);
				3496	Entry.isNest = CS.paramHasAttr(attrInd, ParamAttr::Nest);
				3497	Entry.isByVal = CS.paramHasAttr(attrInd, ParamAttr::ByVal);
				3498	Entry.Alignment = CS.getParamAlignment(attrInd);
				3499	Args.push_back(Entry);
				3500	}
				3501
				3502	if (LandingPad && MMI) {
				3503	// Insert a label before the invoke call to mark the try range. This can be
				3504	// used to detect deletion of the invoke via the MachineModuleInfo.
				3505	BeginLabel = MMI->NextLabelID();
				3506	// Both PendingLoads and PendingExports must be flushed here;
				3507	// this call might not return.
				3508	(void)getRoot();
				3509	DAG.setRoot(DAG.getLabel(ISD::EH_LABEL, getControlRoot(), BeginLabel));
				3510	}
				3511
				3512	std::pair<SDValue,SDValue> Result =
				3513	TLI.LowerCallTo(getRoot(), CS.getType(),
				3514	CS.paramHasAttr(0, ParamAttr::SExt),
				3515	CS.paramHasAttr(0, ParamAttr::ZExt),
				3516	FTy->isVarArg(), CS.getCallingConv(), IsTailCall,
				3517	Callee, Args, DAG);
				3518	if (CS.getType() != Type::VoidTy)
				3519	setValue(CS.getInstruction(), Result.first);
				3520	DAG.setRoot(Result.second);
				3521
				3522	if (LandingPad && MMI) {
				3523	// Insert a label at the end of the invoke call to mark the try range. This
				3524	// can be used to detect deletion of the invoke via the MachineModuleInfo.
				3525	EndLabel = MMI->NextLabelID();
				3526	DAG.setRoot(DAG.getLabel(ISD::EH_LABEL, getRoot(), EndLabel));
				3527
				3528	// Inform MachineModuleInfo of range.
				3529	MMI->addInvoke(LandingPad, BeginLabel, EndLabel);
				3530	}
				3531	}
				3532
				3533
				3534	void SelectionDAGLowering::visitCall(CallInst &I) {
				3535	const char *RenameFn = 0;
				3536	if (Function *F = I.getCalledFunction()) {
				3537	if (F->isDeclaration()) {
				3538	if (unsigned IID = F->getIntrinsicID()) {
				3539	RenameFn = visitIntrinsicCall(I, IID);
				3540	if (!RenameFn)
				3541	return;
				3542	}
				3543	}
				3544
				3545	// Check for well-known libc/libm calls. If the function is internal, it
				3546	// can't be a library call.
				3547	unsigned NameLen = F->getNameLen();
				3548	if (!F->hasInternalLinkage() && NameLen) {
				3549	const char *NameStr = F->getNameStart();
				3550	if (NameStr[0] == 'c' &&
				3551	((NameLen == 8 && !strcmp(NameStr, "copysign")) \|\|
				3552	(NameLen == 9 && !strcmp(NameStr, "copysignf")))) {
				3553	if (I.getNumOperands() == 3 && // Basic sanity checks.
				3554	I.getOperand(1)->getType()->isFloatingPoint() &&
				3555	I.getType() == I.getOperand(1)->getType() &&
				3556	I.getType() == I.getOperand(2)->getType()) {
				3557	SDValue LHS = getValue(I.getOperand(1));
				3558	SDValue RHS = getValue(I.getOperand(2));
				3559	setValue(&I, DAG.getNode(ISD::FCOPYSIGN, LHS.getValueType(),
				3560	LHS, RHS));
				3561	return;
				3562	}
				3563	} else if (NameStr[0] == 'f' &&
				3564	((NameLen == 4 && !strcmp(NameStr, "fabs")) \|\|
				3565	(NameLen == 5 && !strcmp(NameStr, "fabsf")) \|\|
				3566	(NameLen == 5 && !strcmp(NameStr, "fabsl")))) {
				3567	if (I.getNumOperands() == 2 && // Basic sanity checks.
				3568	I.getOperand(1)->getType()->isFloatingPoint() &&
				3569	I.getType() == I.getOperand(1)->getType()) {
				3570	SDValue Tmp = getValue(I.getOperand(1));
				3571	setValue(&I, DAG.getNode(ISD::FABS, Tmp.getValueType(), Tmp));
				3572	return;
				3573	}
				3574	} else if (NameStr[0] == 's' &&
				3575	((NameLen == 3 && !strcmp(NameStr, "sin")) \|\|
				3576	(NameLen == 4 && !strcmp(NameStr, "sinf")) \|\|
				3577	(NameLen == 4 && !strcmp(NameStr, "sinl")))) {
				3578	if (I.getNumOperands() == 2 && // Basic sanity checks.
				3579	I.getOperand(1)->getType()->isFloatingPoint() &&
				3580	I.getType() == I.getOperand(1)->getType()) {
				3581	SDValue Tmp = getValue(I.getOperand(1));
				3582	setValue(&I, DAG.getNode(ISD::FSIN, Tmp.getValueType(), Tmp));
				3583	return;
				3584	}
				3585	} else if (NameStr[0] == 'c' &&
				3586	((NameLen == 3 && !strcmp(NameStr, "cos")) \|\|
				3587	(NameLen == 4 && !strcmp(NameStr, "cosf")) \|\|
				3588	(NameLen == 4 && !strcmp(NameStr, "cosl")))) {
				3589	if (I.getNumOperands() == 2 && // Basic sanity checks.
				3590	I.getOperand(1)->getType()->isFloatingPoint() &&
				3591	I.getType() == I.getOperand(1)->getType()) {
				3592	SDValue Tmp = getValue(I.getOperand(1));
				3593	setValue(&I, DAG.getNode(ISD::FCOS, Tmp.getValueType(), Tmp));
				3594	return;
				3595	}
				3596	}
				3597	}
				3598	} else if (isa<InlineAsm>(I.getOperand(0))) {
				3599	visitInlineAsm(&I);
				3600	return;
				3601	}
				3602
				3603	SDValue Callee;
				3604	if (!RenameFn)
				3605	Callee = getValue(I.getOperand(0));
				3606	else
				3607	Callee = DAG.getExternalSymbol(RenameFn, TLI.getPointerTy());
				3608
				3609	LowerCallTo(&I, Callee, I.isTailCall());
				3610	}
				3611
				3612
				3613	/// getCopyFromRegs - Emit a series of CopyFromReg nodes that copies from
				3614	/// this value and returns the result as a ValueVT value. This uses
				3615	/// Chain/Flag as the input and updates them for the output Chain/Flag.
				3616	/// If the Flag pointer is NULL, no flag is used.
				3617	SDValue RegsForValue::getCopyFromRegs(SelectionDAG &DAG,
				3618	SDValue &Chain,
				3619	SDValue *Flag) const {
				3620	// Assemble the legal parts into the final values.
				3621	SmallVector<SDValue, 4> Values(ValueVTs.size());
				3622	SmallVector<SDValue, 8> Parts;
				3623	for (unsigned Value = 0, Part = 0, e = ValueVTs.size(); Value != e; ++Value) {
				3624	// Copy the legal parts from the registers.
				3625	MVT ValueVT = ValueVTs[Value];
				3626	unsigned NumRegs = TLI->getNumRegisters(ValueVT);
				3627	MVT RegisterVT = RegVTs[Value];
				3628
				3629	Parts.resize(NumRegs);
				3630	for (unsigned i = 0; i != NumRegs; ++i) {
				3631	SDValue P;
				3632	if (Flag == 0)
				3633	P = DAG.getCopyFromReg(Chain, Regs[Part+i], RegisterVT);
				3634	else {
				3635	P = DAG.getCopyFromReg(Chain, Regs[Part+i], RegisterVT, *Flag);
				3636	*Flag = P.getValue(2);
				3637	}
				3638	Chain = P.getValue(1);
				3639
				3640	// If the source register was virtual and if we know something about it,
				3641	// add an assert node.
				3642	if (TargetRegisterInfo::isVirtualRegister(Regs[Part+i]) &&
				3643	RegisterVT.isInteger() && !RegisterVT.isVector()) {
				3644	unsigned SlotNo = Regs[Part+i]-TargetRegisterInfo::FirstVirtualRegister;
				3645	FunctionLoweringInfo &FLI = DAG.getFunctionLoweringInfo();
				3646	if (FLI.LiveOutRegInfo.size() > SlotNo) {
				3647	FunctionLoweringInfo::LiveOutInfo &LOI = FLI.LiveOutRegInfo[SlotNo];
				3648
				3649	unsigned RegSize = RegisterVT.getSizeInBits();
				3650	unsigned NumSignBits = LOI.NumSignBits;
				3651	unsigned NumZeroBits = LOI.KnownZero.countLeadingOnes();
				3652
				3653	// FIXME: We capture more information than the dag can represent. For
				3654	// now, just use the tightest assertzext/assertsext possible.
				3655	bool isSExt = true;
				3656	MVT FromVT(MVT::Other);
				3657	if (NumSignBits == RegSize)
				3658	isSExt = true, FromVT = MVT::i1; // ASSERT SEXT 1
				3659	else if (NumZeroBits >= RegSize-1)
				3660	isSExt = false, FromVT = MVT::i1; // ASSERT ZEXT 1
				3661	else if (NumSignBits > RegSize-8)
				3662	isSExt = true, FromVT = MVT::i8; // ASSERT SEXT 8
				3663	else if (NumZeroBits >= RegSize-9)
				3664	isSExt = false, FromVT = MVT::i8; // ASSERT ZEXT 8
				3665	else if (NumSignBits > RegSize-16)
				3666	isSExt = true, FromVT = MVT::i16; // ASSERT SEXT 16
				3667	else if (NumZeroBits >= RegSize-17)
				3668	isSExt = false, FromVT = MVT::i16; // ASSERT ZEXT 16
				3669	else if (NumSignBits > RegSize-32)
				3670	isSExt = true, FromVT = MVT::i32; // ASSERT SEXT 32
				3671	else if (NumZeroBits >= RegSize-33)
				3672	isSExt = false, FromVT = MVT::i32; // ASSERT ZEXT 32
				3673
				3674	if (FromVT != MVT::Other) {
				3675	P = DAG.getNode(isSExt ? ISD::AssertSext : ISD::AssertZext,
				3676	RegisterVT, P, DAG.getValueType(FromVT));
				3677
				3678	}
				3679	}
				3680	}
				3681
				3682	Parts[i] = P;
				3683	}
				3684
				3685	Values[Value] = getCopyFromParts(DAG, Parts.begin(), NumRegs, RegisterVT,
				3686	ValueVT);
				3687	Part += NumRegs;
				3688	Parts.clear();
				3689	}
				3690
				3691	return DAG.getMergeValues(DAG.getVTList(&ValueVTs[0], ValueVTs.size()),
				3692	&Values[0], ValueVTs.size());
				3693	}
				3694
				3695	/// getCopyToRegs - Emit a series of CopyToReg nodes that copies the
				3696	/// specified value into the registers specified by this object. This uses
				3697	/// Chain/Flag as the input and updates them for the output Chain/Flag.
				3698	/// If the Flag pointer is NULL, no flag is used.
				3699	void RegsForValue::getCopyToRegs(SDValue Val, SelectionDAG &DAG,
				3700	SDValue &Chain, SDValue *Flag) const {
				3701	// Get the list of the values's legal parts.
				3702	unsigned NumRegs = Regs.size();
				3703	SmallVector<SDValue, 8> Parts(NumRegs);
				3704	for (unsigned Value = 0, Part = 0, e = ValueVTs.size(); Value != e; ++Value) {
				3705	MVT ValueVT = ValueVTs[Value];
				3706	unsigned NumParts = TLI->getNumRegisters(ValueVT);
				3707	MVT RegisterVT = RegVTs[Value];
				3708
				3709	getCopyToParts(DAG, Val.getValue(Val.getResNo() + Value),
				3710	&Parts[Part], NumParts, RegisterVT);
				3711	Part += NumParts;
				3712	}
				3713
				3714	// Copy the parts into the registers.
				3715	SmallVector<SDValue, 8> Chains(NumRegs);
				3716	for (unsigned i = 0; i != NumRegs; ++i) {
				3717	SDValue Part;
				3718	if (Flag == 0)
				3719	Part = DAG.getCopyToReg(Chain, Regs[i], Parts[i]);
				3720	else {
				3721	Part = DAG.getCopyToReg(Chain, Regs[i], Parts[i], *Flag);
				3722	*Flag = Part.getValue(1);
				3723	}
				3724	Chains[i] = Part.getValue(0);
				3725	}
				3726
				3727	if (NumRegs == 1 \|\| Flag)
				3728	// If NumRegs > 1 && Flag is used then the use of the last CopyToReg is
				3729	// flagged to it. That is the CopyToReg nodes and the user are considered
				3730	// a single scheduling unit. If we create a TokenFactor and return it as
				3731	// chain, then the TokenFactor is both a predecessor (operand) of the
				3732	// user as well as a successor (the TF operands are flagged to the user).
				3733	// c1, f1 = CopyToReg
				3734	// c2, f2 = CopyToReg
				3735	// c3 = TokenFactor c1, c2
				3736	// ...
				3737	// = op c3, ..., f2
				3738	Chain = Chains[NumRegs-1];
				3739	else
				3740	Chain = DAG.getNode(ISD::TokenFactor, MVT::Other, &Chains[0], NumRegs);
				3741	}
				3742
				3743	/// AddInlineAsmOperands - Add this value to the specified inlineasm node
				3744	/// operand list. This adds the code marker and includes the number of
				3745	/// values added into it.
				3746	void RegsForValue::AddInlineAsmOperands(unsigned Code, SelectionDAG &DAG,
				3747	std::vector<SDValue> &Ops) const {
				3748	MVT IntPtrTy = DAG.getTargetLoweringInfo().getPointerTy();
				3749	Ops.push_back(DAG.getTargetConstant(Code \| (Regs.size() << 3), IntPtrTy));
				3750	for (unsigned Value = 0, Reg = 0, e = ValueVTs.size(); Value != e; ++Value) {
				3751	unsigned NumRegs = TLI->getNumRegisters(ValueVTs[Value]);
				3752	MVT RegisterVT = RegVTs[Value];
				3753	for (unsigned i = 0; i != NumRegs; ++i)
				3754	Ops.push_back(DAG.getRegister(Regs[Reg++], RegisterVT));
				3755	}
				3756	}
				3757
				3758	/// isAllocatableRegister - If the specified register is safe to allocate,
				3759	/// i.e. it isn't a stack pointer or some other special register, return the
				3760	/// register class for the register. Otherwise, return null.
				3761	static const TargetRegisterClass *
				3762	isAllocatableRegister(unsigned Reg, MachineFunction &MF,
				3763	const TargetLowering &TLI,
				3764	const TargetRegisterInfo *TRI) {
				3765	MVT FoundVT = MVT::Other;
				3766	const TargetRegisterClass *FoundRC = 0;
				3767	for (TargetRegisterInfo::regclass_iterator RCI = TRI->regclass_begin(),
				3768	E = TRI->regclass_end(); RCI != E; ++RCI) {
				3769	MVT ThisVT = MVT::Other;
				3770
				3771	const TargetRegisterClass RC = RCI;
				3772	// If none of the the value types for this register class are valid, we
				3773	// can't use it. For example, 64-bit reg classes on 32-bit targets.
				3774	for (TargetRegisterClass::vt_iterator I = RC->vt_begin(), E = RC->vt_end();
				3775	I != E; ++I) {
				3776	if (TLI.isTypeLegal(*I)) {
				3777	// If we have already found this register in a different register class,
				3778	// choose the one with the largest VT specified. For example, on
				3779	// PowerPC, we favor f64 register classes over f32.
				3780	if (FoundVT == MVT::Other \|\| FoundVT.bitsLT(*I)) {
				3781	ThisVT = *I;
				3782	break;
				3783	}
				3784	}
				3785	}
				3786
				3787	if (ThisVT == MVT::Other) continue;
				3788
				3789	// NOTE: This isn't ideal. In particular, this might allocate the
				3790	// frame pointer in functions that need it (due to them not being taken
				3791	// out of allocation, because a variable sized allocation hasn't been seen
				3792	// yet). This is a slight code pessimization, but should still work.
				3793	for (TargetRegisterClass::iterator I = RC->allocation_order_begin(MF),
				3794	E = RC->allocation_order_end(MF); I != E; ++I)
				3795	if (*I == Reg) {
				3796	// We found a matching register class. Keep looking at others in case
				3797	// we find one with larger registers that this physreg is also in.
				3798	FoundRC = RC;
				3799	FoundVT = ThisVT;
				3800	break;
				3801	}
				3802	}
				3803	return FoundRC;
				3804	}
				3805
				3806
				3807	namespace llvm {
				3808	/// AsmOperandInfo - This contains information for each constraint that we are
				3809	/// lowering.
				3810	struct SDISelAsmOperandInfo : public TargetLowering::AsmOperandInfo {
				3811	/// CallOperand - If this is the result output operand or a clobber
				3812	/// this is null, otherwise it is the incoming operand to the CallInst.
				3813	/// This gets modified as the asm is processed.
				3814	SDValue CallOperand;
				3815
				3816	/// AssignedRegs - If this is a register or register class operand, this
				3817	/// contains the set of register corresponding to the operand.
				3818	RegsForValue AssignedRegs;
				3819
				3820	explicit SDISelAsmOperandInfo(const InlineAsm::ConstraintInfo &info)
				3821	: TargetLowering::AsmOperandInfo(info), CallOperand(0,0) {
				3822	}
				3823
				3824	/// MarkAllocatedRegs - Once AssignedRegs is set, mark the assigned registers
				3825	/// busy in OutputRegs/InputRegs.
				3826	void MarkAllocatedRegs(bool isOutReg, bool isInReg,
				3827	std::set<unsigned> &OutputRegs,
				3828	std::set<unsigned> &InputRegs,
				3829	const TargetRegisterInfo &TRI) const {
				3830	if (isOutReg) {
				3831	for (unsigned i = 0, e = AssignedRegs.Regs.size(); i != e; ++i)
				3832	MarkRegAndAliases(AssignedRegs.Regs[i], OutputRegs, TRI);
				3833	}
				3834	if (isInReg) {
				3835	for (unsigned i = 0, e = AssignedRegs.Regs.size(); i != e; ++i)
				3836	MarkRegAndAliases(AssignedRegs.Regs[i], InputRegs, TRI);
				3837	}
				3838	}
				3839
				3840	private:
				3841	/// MarkRegAndAliases - Mark the specified register and all aliases in the
				3842	/// specified set.
				3843	static void MarkRegAndAliases(unsigned Reg, std::set<unsigned> &Regs,
				3844	const TargetRegisterInfo &TRI) {
				3845	assert(TargetRegisterInfo::isPhysicalRegister(Reg) && "Isn't a physreg");
				3846	Regs.insert(Reg);
				3847	if (const unsigned *Aliases = TRI.getAliasSet(Reg))
				3848	for (; *Aliases; ++Aliases)
				3849	Regs.insert(*Aliases);
				3850	}
				3851	};
				3852	} // end llvm namespace.
				3853
				3854
				3855	/// GetRegistersForValue - Assign registers (virtual or physical) for the
				3856	/// specified operand. We prefer to assign virtual registers, to allow the
				3857	/// register allocator handle the assignment process. However, if the asm uses
				3858	/// features that we can't model on machineinstrs, we have SDISel do the
				3859	/// allocation. This produces generally horrible, but correct, code.
				3860	///
				3861	/// OpInfo describes the operand.
				3862	/// HasEarlyClobber is true if there are any early clobber constraints (=&r)
				3863	/// or any explicitly clobbered registers.
				3864	/// Input and OutputRegs are the set of already allocated physical registers.
				3865	///
				3866	void SelectionDAGLowering::
				3867	GetRegistersForValue(SDISelAsmOperandInfo &OpInfo, bool HasEarlyClobber,
				3868	std::set<unsigned> &OutputRegs,
				3869	std::set<unsigned> &InputRegs) {
				3870	// Compute whether this value requires an input register, an output register,
				3871	// or both.
				3872	bool isOutReg = false;
				3873	bool isInReg = false;
				3874	switch (OpInfo.Type) {
				3875	case InlineAsm::isOutput:
				3876	isOutReg = true;
				3877
				3878	// If this is an early-clobber output, or if there is an input
				3879	// constraint that matches this, we need to reserve the input register
				3880	// so no other inputs allocate to it.
				3881	isInReg = OpInfo.isEarlyClobber \|\| OpInfo.hasMatchingInput;
				3882	break;
				3883	case InlineAsm::isInput:
				3884	isInReg = true;
				3885	isOutReg = false;
				3886	break;
				3887	case InlineAsm::isClobber:
				3888	isOutReg = true;
				3889	isInReg = true;
				3890	break;
				3891	}
				3892
				3893
				3894	MachineFunction &MF = DAG.getMachineFunction();
				3895	SmallVector<unsigned, 4> Regs;
				3896
				3897	// If this is a constraint for a single physreg, or a constraint for a
				3898	// register class, find it.
				3899	std::pair<unsigned, const TargetRegisterClass*> PhysReg =
				3900	TLI.getRegForInlineAsmConstraint(OpInfo.ConstraintCode,
				3901	OpInfo.ConstraintVT);
				3902
				3903	unsigned NumRegs = 1;
				3904	if (OpInfo.ConstraintVT != MVT::Other)
				3905	NumRegs = TLI.getNumRegisters(OpInfo.ConstraintVT);
				3906	MVT RegVT;
				3907	MVT ValueVT = OpInfo.ConstraintVT;
				3908
				3909
				3910	// If this is a constraint for a specific physical register, like {r17},
				3911	// assign it now.
				3912	if (PhysReg.first) {
				3913	if (OpInfo.ConstraintVT == MVT::Other)
				3914	ValueVT = *PhysReg.second->vt_begin();
				3915
				3916	// Get the actual register value type. This is important, because the user
				3917	// may have asked for (e.g.) the AX register in i32 type. We need to
				3918	// remember that AX is actually i16 to get the right extension.
				3919	RegVT = *PhysReg.second->vt_begin();
				3920
				3921	// This is a explicit reference to a physical register.
				3922	Regs.push_back(PhysReg.first);
				3923
				3924	// If this is an expanded reference, add the rest of the regs to Regs.
				3925	if (NumRegs != 1) {
				3926	TargetRegisterClass::iterator I = PhysReg.second->begin();
				3927	for (; *I != PhysReg.first; ++I)
				3928	assert(I != PhysReg.second->end() && "Didn't find reg!");
				3929
				3930	// Already added the first reg.
				3931	--NumRegs; ++I;
				3932	for (; NumRegs; --NumRegs, ++I) {
				3933	assert(I != PhysReg.second->end() && "Ran out of registers to allocate!");
				3934	Regs.push_back(*I);
				3935	}
				3936	}
				3937	OpInfo.AssignedRegs = RegsForValue(TLI, Regs, RegVT, ValueVT);
				3938	const TargetRegisterInfo *TRI = DAG.getTarget().getRegisterInfo();
				3939	OpInfo.MarkAllocatedRegs(isOutReg, isInReg, OutputRegs, InputRegs, *TRI);
				3940	return;
				3941	}
				3942
				3943	// Otherwise, if this was a reference to an LLVM register class, create vregs
				3944	// for this reference.
				3945	std::vector<unsigned> RegClassRegs;
				3946	const TargetRegisterClass *RC = PhysReg.second;
				3947	if (RC) {
				3948	// If this is an early clobber or tied register, our regalloc doesn't know
				3949	// how to maintain the constraint. If it isn't, go ahead and create vreg
				3950	// and let the regalloc do the right thing.
				3951	if (!OpInfo.hasMatchingInput && !OpInfo.isEarlyClobber &&
				3952	// If there is some other early clobber and this is an input register,
				3953	// then we are forced to pre-allocate the input reg so it doesn't
				3954	// conflict with the earlyclobber.
				3955	!(OpInfo.Type == InlineAsm::isInput && HasEarlyClobber)) {
				3956	RegVT = *PhysReg.second->vt_begin();
				3957
				3958	if (OpInfo.ConstraintVT == MVT::Other)
				3959	ValueVT = RegVT;
				3960
				3961	// Create the appropriate number of virtual registers.
				3962	MachineRegisterInfo &RegInfo = MF.getRegInfo();
				3963	for (; NumRegs; --NumRegs)
				3964	Regs.push_back(RegInfo.createVirtualRegister(PhysReg.second));
				3965
				3966	OpInfo.AssignedRegs = RegsForValue(TLI, Regs, RegVT, ValueVT);
				3967	return;
				3968	}
				3969
				3970	// Otherwise, we can't allocate it. Let the code below figure out how to
				3971	// maintain these constraints.
				3972	RegClassRegs.assign(PhysReg.second->begin(), PhysReg.second->end());
				3973
				3974	} else {
				3975	// This is a reference to a register class that doesn't directly correspond
				3976	// to an LLVM register class. Allocate NumRegs consecutive, available,
				3977	// registers from the class.
				3978	RegClassRegs = TLI.getRegClassForInlineAsmConstraint(OpInfo.ConstraintCode,
				3979	OpInfo.ConstraintVT);
				3980	}
				3981
				3982	const TargetRegisterInfo *TRI = DAG.getTarget().getRegisterInfo();
				3983	unsigned NumAllocated = 0;
				3984	for (unsigned i = 0, e = RegClassRegs.size(); i != e; ++i) {
				3985	unsigned Reg = RegClassRegs[i];
				3986	// See if this register is available.
				3987	if ((isOutReg && OutputRegs.count(Reg)) \|\| // Already used.
				3988	(isInReg && InputRegs.count(Reg))) { // Already used.
				3989	// Make sure we find consecutive registers.
				3990	NumAllocated = 0;
				3991	continue;
				3992	}
				3993
				3994	// Check to see if this register is allocatable (i.e. don't give out the
				3995	// stack pointer).
				3996	if (RC == 0) {
				3997	RC = isAllocatableRegister(Reg, MF, TLI, TRI);
				3998	if (!RC) { // Couldn't allocate this register.
				3999	// Reset NumAllocated to make sure we return consecutive registers.
				4000	NumAllocated = 0;
				4001	continue;
				4002	}
				4003	}
				4004
				4005	// Okay, this register is good, we can use it.
				4006	++NumAllocated;
				4007
				4008	// If we allocated enough consecutive registers, succeed.
				4009	if (NumAllocated == NumRegs) {
				4010	unsigned RegStart = (i-NumAllocated)+1;
				4011	unsigned RegEnd = i+1;
				4012	// Mark all of the allocated registers used.
				4013	for (unsigned i = RegStart; i != RegEnd; ++i)
				4014	Regs.push_back(RegClassRegs[i]);
				4015
				4016	OpInfo.AssignedRegs = RegsForValue(TLI, Regs, *RC->vt_begin(),
				4017	OpInfo.ConstraintVT);
				4018	OpInfo.MarkAllocatedRegs(isOutReg, isInReg, OutputRegs, InputRegs, *TRI);
				4019	return;
				4020	}
				4021	}
				4022
				4023	// Otherwise, we couldn't allocate enough registers for this.
				4024	}
				4025
				4026
				4027	/// visitInlineAsm - Handle a call to an InlineAsm object.
				4028	///
				4029	void SelectionDAGLowering::visitInlineAsm(CallSite CS) {
				4030	InlineAsm *IA = cast<InlineAsm>(CS.getCalledValue());
				4031
				4032	/// ConstraintOperands - Information about all of the constraints.
				4033	std::vector<SDISelAsmOperandInfo> ConstraintOperands;
				4034
				4035	SDValue Chain = getRoot();
				4036	SDValue Flag;
				4037
				4038	std::set<unsigned> OutputRegs, InputRegs;
				4039
				4040	// Do a prepass over the constraints, canonicalizing them, and building up the
				4041	// ConstraintOperands list.
				4042	std::vector<InlineAsm::ConstraintInfo>
				4043	ConstraintInfos = IA->ParseConstraints();
				4044
				4045	// SawEarlyClobber - Keep track of whether we saw an earlyclobber output
				4046	// constraint. If so, we can't let the register allocator allocate any input
				4047	// registers, because it will not know to avoid the earlyclobbered output reg.
				4048	bool SawEarlyClobber = false;
				4049
				4050	unsigned ArgNo = 0; // ArgNo - The argument of the CallInst.
				4051	unsigned ResNo = 0; // ResNo - The result number of the next output.
				4052	for (unsigned i = 0, e = ConstraintInfos.size(); i != e; ++i) {
				4053	ConstraintOperands.push_back(SDISelAsmOperandInfo(ConstraintInfos[i]));
				4054	SDISelAsmOperandInfo &OpInfo = ConstraintOperands.back();
				4055
				4056	MVT OpVT = MVT::Other;
				4057
				4058	// Compute the value type for each operand.
				4059	switch (OpInfo.Type) {
				4060	case InlineAsm::isOutput:
				4061	// Indirect outputs just consume an argument.
				4062	if (OpInfo.isIndirect) {
				4063	OpInfo.CallOperandVal = CS.getArgument(ArgNo++);
				4064	break;
				4065	}
				4066	// The return value of the call is this value. As such, there is no
				4067	// corresponding argument.
				4068	assert(CS.getType() != Type::VoidTy && "Bad inline asm!");
				4069	if (const StructType *STy = dyn_cast<StructType>(CS.getType())) {
				4070	OpVT = TLI.getValueType(STy->getElementType(ResNo));
				4071	} else {
				4072	assert(ResNo == 0 && "Asm only has one result!");
				4073	OpVT = TLI.getValueType(CS.getType());
				4074	}
				4075	++ResNo;
				4076	break;
				4077	case InlineAsm::isInput:
				4078	OpInfo.CallOperandVal = CS.getArgument(ArgNo++);
				4079	break;
				4080	case InlineAsm::isClobber:
				4081	// Nothing to do.
				4082	break;
				4083	}
				4084
				4085	// If this is an input or an indirect output, process the call argument.
				4086	// BasicBlocks are labels, currently appearing only in asm's.
				4087	if (OpInfo.CallOperandVal) {
				4088	if (BasicBlock *BB = dyn_cast<BasicBlock>(OpInfo.CallOperandVal))
				4089	OpInfo.CallOperand = DAG.getBasicBlock(FuncInfo.MBBMap[BB]);
				4090	else {
				4091	OpInfo.CallOperand = getValue(OpInfo.CallOperandVal);
				4092	const Type *OpTy = OpInfo.CallOperandVal->getType();
				4093	// If this is an indirect operand, the operand is a pointer to the
				4094	// accessed type.
				4095	if (OpInfo.isIndirect)
				4096	OpTy = cast<PointerType>(OpTy)->getElementType();
				4097
				4098	// If OpTy is not a single value, it may be a struct/union that we
				4099	// can tile with integers.
				4100	if (!OpTy->isSingleValueType() && OpTy->isSized()) {
				4101	unsigned BitSize = TD->getTypeSizeInBits(OpTy);
				4102	switch (BitSize) {
				4103	default: break;
				4104	case 1:
				4105	case 8:
				4106	case 16:
				4107	case 32:
				4108	case 64:
				4109	OpTy = IntegerType::get(BitSize);
				4110	break;
				4111	}
				4112	}
				4113
				4114	OpVT = TLI.getValueType(OpTy, true);
				4115	}
				4116	}
				4117
				4118	OpInfo.ConstraintVT = OpVT;
				4119
				4120	// Compute the constraint code and ConstraintType to use.
				4121	TLI.ComputeConstraintToUse(OpInfo, OpInfo.CallOperand, &DAG);
				4122
				4123	// Keep track of whether we see an earlyclobber.
				4124	SawEarlyClobber \|= OpInfo.isEarlyClobber;
				4125
				4126	// If we see a clobber of a register, it is an early clobber.
				4127	if (!SawEarlyClobber &&
				4128	OpInfo.Type == InlineAsm::isClobber &&
				4129	OpInfo.ConstraintType == TargetLowering::C_Register) {
				4130	// Note that we want to ignore things that we don't track here, like
				4131	// dirflag, fpsr, flags, etc.
				4132	std::pair<unsigned, const TargetRegisterClass*> PhysReg =
				4133	TLI.getRegForInlineAsmConstraint(OpInfo.ConstraintCode,
				4134	OpInfo.ConstraintVT);
				4135	if (PhysReg.first \|\| PhysReg.second) {
				4136	// This is a register we know of.
				4137	SawEarlyClobber = true;
				4138	}
				4139	}
				4140
				4141	// If this is a memory input, and if the operand is not indirect, do what we
				4142	// need to to provide an address for the memory input.
				4143	if (OpInfo.ConstraintType == TargetLowering::C_Memory &&
				4144	!OpInfo.isIndirect) {
				4145	assert(OpInfo.Type == InlineAsm::isInput &&
				4146	"Can only indirectify direct input operands!");
				4147
				4148	// Memory operands really want the address of the value. If we don't have
				4149	// an indirect input, put it in the constpool if we can, otherwise spill
				4150	// it to a stack slot.
				4151
				4152	// If the operand is a float, integer, or vector constant, spill to a
				4153	// constant pool entry to get its address.
				4154	Value *OpVal = OpInfo.CallOperandVal;
				4155	if (isa<ConstantFP>(OpVal) \|\| isa<ConstantInt>(OpVal) \|\|
				4156	isa<ConstantVector>(OpVal)) {
				4157	OpInfo.CallOperand = DAG.getConstantPool(cast<Constant>(OpVal),
				4158	TLI.getPointerTy());
				4159	} else {
				4160	// Otherwise, create a stack slot and emit a store to it before the
				4161	// asm.
				4162	const Type *Ty = OpVal->getType();
				4163	uint64_t TySize = TLI.getTargetData()->getABITypeSize(Ty);
				4164	unsigned Align = TLI.getTargetData()->getPrefTypeAlignment(Ty);
				4165	MachineFunction &MF = DAG.getMachineFunction();
				4166	int SSFI = MF.getFrameInfo()->CreateStackObject(TySize, Align);
				4167	SDValue StackSlot = DAG.getFrameIndex(SSFI, TLI.getPointerTy());
				4168	Chain = DAG.getStore(Chain, OpInfo.CallOperand, StackSlot, NULL, 0);
				4169	OpInfo.CallOperand = StackSlot;
				4170	}
				4171
				4172	// There is no longer a Value* corresponding to this operand.
				4173	OpInfo.CallOperandVal = 0;
				4174	// It is now an indirect operand.
				4175	OpInfo.isIndirect = true;
				4176	}
				4177
				4178	// If this constraint is for a specific register, allocate it before
				4179	// anything else.
				4180	if (OpInfo.ConstraintType == TargetLowering::C_Register)
				4181	GetRegistersForValue(OpInfo, SawEarlyClobber, OutputRegs, InputRegs);
				4182	}
				4183	ConstraintInfos.clear();
				4184
				4185
				4186	// Second pass - Loop over all of the operands, assigning virtual or physregs
				4187	// to registerclass operands.
				4188	for (unsigned i = 0, e = ConstraintOperands.size(); i != e; ++i) {
				4189	SDISelAsmOperandInfo &OpInfo = ConstraintOperands[i];
				4190
				4191	// C_Register operands have already been allocated, Other/Memory don't need
				4192	// to be.
				4193	if (OpInfo.ConstraintType == TargetLowering::C_RegisterClass)
				4194	GetRegistersForValue(OpInfo, SawEarlyClobber, OutputRegs, InputRegs);
				4195	}
				4196
				4197	// AsmNodeOperands - The operands for the ISD::INLINEASM node.
				4198	std::vector<SDValue> AsmNodeOperands;
				4199	AsmNodeOperands.push_back(SDValue()); // reserve space for input chain
				4200	AsmNodeOperands.push_back(
				4201	DAG.getTargetExternalSymbol(IA->getAsmString().c_str(), MVT::Other));
				4202
				4203
				4204	// Loop over all of the inputs, copying the operand values into the
				4205	// appropriate registers and processing the output regs.
				4206	RegsForValue RetValRegs;
				4207
				4208	// IndirectStoresToEmit - The set of stores to emit after the inline asm node.
				4209	std::vector<std::pair<RegsForValue, Value*> > IndirectStoresToEmit;
				4210
				4211	for (unsigned i = 0, e = ConstraintOperands.size(); i != e; ++i) {
				4212	SDISelAsmOperandInfo &OpInfo = ConstraintOperands[i];
				4213
				4214	switch (OpInfo.Type) {
				4215	case InlineAsm::isOutput: {
				4216	if (OpInfo.ConstraintType != TargetLowering::C_RegisterClass &&
				4217	OpInfo.ConstraintType != TargetLowering::C_Register) {
				4218	// Memory output, or 'other' output (e.g. 'X' constraint).
				4219	assert(OpInfo.isIndirect && "Memory output must be indirect operand");
				4220
				4221	// Add information to the INLINEASM node to know about this output.
				4222	unsigned ResOpType = 4/MEM/ \| (1 << 3);
				4223	AsmNodeOperands.push_back(DAG.getTargetConstant(ResOpType,
				4224	TLI.getPointerTy()));
				4225	AsmNodeOperands.push_back(OpInfo.CallOperand);
				4226	break;
				4227	}
				4228
				4229	// Otherwise, this is a register or register class output.
				4230
				4231	// Copy the output from the appropriate register. Find a register that
				4232	// we can use.
				4233	if (OpInfo.AssignedRegs.Regs.empty()) {
				4234	cerr << "Couldn't allocate output reg for constraint '"
				4235	<< OpInfo.ConstraintCode << "'!\n";
				4236	exit(1);
				4237	}
				4238
				4239	// If this is an indirect operand, store through the pointer after the
				4240	// asm.
				4241	if (OpInfo.isIndirect) {
				4242	IndirectStoresToEmit.push_back(std::make_pair(OpInfo.AssignedRegs,
				4243	OpInfo.CallOperandVal));
				4244	} else {
				4245	// This is the result value of the call.
				4246	assert(CS.getType() != Type::VoidTy && "Bad inline asm!");
				4247	// Concatenate this output onto the outputs list.
				4248	RetValRegs.append(OpInfo.AssignedRegs);
				4249	}
				4250
				4251	// Add information to the INLINEASM node to know that this register is
				4252	// set.
				4253	OpInfo.AssignedRegs.AddInlineAsmOperands(2 /REGDEF/, DAG,
				4254	AsmNodeOperands);
				4255	break;
				4256	}
				4257	case InlineAsm::isInput: {
				4258	SDValue InOperandVal = OpInfo.CallOperand;
				4259
				4260	if (isdigit(OpInfo.ConstraintCode[0])) { // Matching constraint?
				4261	// If this is required to match an output register we have already set,
				4262	// just use its register.
				4263	unsigned OperandNo = atoi(OpInfo.ConstraintCode.c_str());
				4264
				4265	// Scan until we find the definition we already emitted of this operand.
				4266	// When we find it, create a RegsForValue operand.
				4267	unsigned CurOp = 2; // The first operand.
				4268	for (; OperandNo; --OperandNo) {
				4269	// Advance to the next operand.
				4270	unsigned NumOps =
				4271	cast<ConstantSDNode>(AsmNodeOperands[CurOp])->getValue();
				4272	assert(((NumOps & 7) == 2 /REGDEF/ \|\|
				4273	(NumOps & 7) == 4 /MEM/) &&
				4274	"Skipped past definitions?");
				4275	CurOp += (NumOps>>3)+1;
				4276	}
				4277
				4278	unsigned NumOps =
				4279	cast<ConstantSDNode>(AsmNodeOperands[CurOp])->getValue();
				4280	if ((NumOps & 7) == 2 /REGDEF/) {
				4281	// Add NumOps>>3 registers to MatchedRegs.
				4282	RegsForValue MatchedRegs;
				4283	MatchedRegs.TLI = &TLI;
				4284	MatchedRegs.ValueVTs.push_back(InOperandVal.getValueType());
				4285	MatchedRegs.RegVTs.push_back(AsmNodeOperands[CurOp+1].getValueType());
				4286	for (unsigned i = 0, e = NumOps>>3; i != e; ++i) {
				4287	unsigned Reg =
				4288	cast<RegisterSDNode>(AsmNodeOperands[++CurOp])->getReg();
				4289	MatchedRegs.Regs.push_back(Reg);
				4290	}
				4291
				4292	// Use the produced MatchedRegs object to
				4293	MatchedRegs.getCopyToRegs(InOperandVal, DAG, Chain, &Flag);
				4294	MatchedRegs.AddInlineAsmOperands(1 /REGUSE/, DAG, AsmNodeOperands);
				4295	break;
				4296	} else {
				4297	assert((NumOps & 7) == 4/MEM/ && "Unknown matching constraint!");
				4298	assert((NumOps >> 3) == 1 && "Unexpected number of operands");
				4299	// Add information to the INLINEASM node to know about this input.
				4300	unsigned ResOpType = 4/MEM/ \| (1 << 3);
				4301	AsmNodeOperands.push_back(DAG.getTargetConstant(ResOpType,
				4302	TLI.getPointerTy()));
				4303	AsmNodeOperands.push_back(AsmNodeOperands[CurOp+1]);
				4304	break;
				4305	}
				4306	}
				4307
				4308	if (OpInfo.ConstraintType == TargetLowering::C_Other) {
				4309	assert(!OpInfo.isIndirect &&
				4310	"Don't know how to handle indirect other inputs yet!");
				4311
				4312	std::vector<SDValue> Ops;
				4313	TLI.LowerAsmOperandForConstraint(InOperandVal, OpInfo.ConstraintCode[0],
				4314	Ops, DAG);
				4315	if (Ops.empty()) {
				4316	cerr << "Invalid operand for inline asm constraint '"
				4317	<< OpInfo.ConstraintCode << "'!\n";
				4318	exit(1);
				4319	}
				4320
				4321	// Add information to the INLINEASM node to know about this input.
				4322	unsigned ResOpType = 3 /IMM/ \| (Ops.size() << 3);
				4323	AsmNodeOperands.push_back(DAG.getTargetConstant(ResOpType,
				4324	TLI.getPointerTy()));
				4325	AsmNodeOperands.insert(AsmNodeOperands.end(), Ops.begin(), Ops.end());
				4326	break;
				4327	} else if (OpInfo.ConstraintType == TargetLowering::C_Memory) {
				4328	assert(OpInfo.isIndirect && "Operand must be indirect to be a mem!");
				4329	assert(InOperandVal.getValueType() == TLI.getPointerTy() &&
				4330	"Memory operands expect pointer values");
				4331
				4332	// Add information to the INLINEASM node to know about this input.
				4333	unsigned ResOpType = 4/MEM/ \| (1 << 3);
				4334	AsmNodeOperands.push_back(DAG.getTargetConstant(ResOpType,
				4335	TLI.getPointerTy()));
				4336	AsmNodeOperands.push_back(InOperandVal);
				4337	break;
				4338	}
				4339
				4340	assert((OpInfo.ConstraintType == TargetLowering::C_RegisterClass \|\|
				4341	OpInfo.ConstraintType == TargetLowering::C_Register) &&
				4342	"Unknown constraint type!");
				4343	assert(!OpInfo.isIndirect &&
				4344	"Don't know how to handle indirect register inputs yet!");
				4345
				4346	// Copy the input into the appropriate registers.
				4347	assert(!OpInfo.AssignedRegs.Regs.empty() &&
				4348	"Couldn't allocate input reg!");
				4349
				4350	OpInfo.AssignedRegs.getCopyToRegs(InOperandVal, DAG, Chain, &Flag);
				4351
				4352	OpInfo.AssignedRegs.AddInlineAsmOperands(1/REGUSE/, DAG,
				4353	AsmNodeOperands);
				4354	break;
				4355	}
				4356	case InlineAsm::isClobber: {
				4357	// Add the clobbered value to the operand list, so that the register
				4358	// allocator is aware that the physreg got clobbered.
				4359	if (!OpInfo.AssignedRegs.Regs.empty())
				4360	OpInfo.AssignedRegs.AddInlineAsmOperands(2/REGDEF/, DAG,
				4361	AsmNodeOperands);
				4362	break;
				4363	}
				4364	}
				4365	}
				4366
				4367	// Finish up input operands.
				4368	AsmNodeOperands[0] = Chain;
				4369	if (Flag.getNode()) AsmNodeOperands.push_back(Flag);
				4370
				4371	Chain = DAG.getNode(ISD::INLINEASM,
				4372	DAG.getNodeValueTypes(MVT::Other, MVT::Flag), 2,
				4373	&AsmNodeOperands[0], AsmNodeOperands.size());
				4374	Flag = Chain.getValue(1);
				4375
				4376	// If this asm returns a register value, copy the result from that register
				4377	// and set it as the value of the call.
				4378	if (!RetValRegs.Regs.empty()) {
				4379	SDValue Val = RetValRegs.getCopyFromRegs(DAG, Chain, &Flag);
				4380
				4381	// If any of the results of the inline asm is a vector, it may have the
				4382	// wrong width/num elts. This can happen for register classes that can
				4383	// contain multiple different value types. The preg or vreg allocated may
				4384	// not have the same VT as was expected. Convert it to the right type with
				4385	// bit_convert.
				4386	if (const StructType *ResSTy = dyn_cast<StructType>(CS.getType())) {
				4387	for (unsigned i = 0, e = ResSTy->getNumElements(); i != e; ++i) {
				4388	if (Val.getNode()->getValueType(i).isVector())
				4389	Val = DAG.getNode(ISD::BIT_CONVERT,
				4390	TLI.getValueType(ResSTy->getElementType(i)), Val);
				4391	}
				4392	} else {
				4393	if (Val.getValueType().isVector())
				4394	Val = DAG.getNode(ISD::BIT_CONVERT, TLI.getValueType(CS.getType()),
				4395	Val);
				4396	}
				4397
				4398	setValue(CS.getInstruction(), Val);
				4399	}
				4400
				4401	std::vector<std::pair<SDValue, Value*> > StoresToEmit;
				4402
				4403	// Process indirect outputs, first output all of the flagged copies out of
				4404	// physregs.
				4405	for (unsigned i = 0, e = IndirectStoresToEmit.size(); i != e; ++i) {
				4406	RegsForValue &OutRegs = IndirectStoresToEmit[i].first;
				4407	Value *Ptr = IndirectStoresToEmit[i].second;
				4408	SDValue OutVal = OutRegs.getCopyFromRegs(DAG, Chain, &Flag);
				4409	StoresToEmit.push_back(std::make_pair(OutVal, Ptr));
				4410	}
				4411
				4412	// Emit the non-flagged stores from the physregs.
				4413	SmallVector<SDValue, 8> OutChains;
				4414	for (unsigned i = 0, e = StoresToEmit.size(); i != e; ++i)
				4415	OutChains.push_back(DAG.getStore(Chain, StoresToEmit[i].first,
				4416	getValue(StoresToEmit[i].second),
				4417	StoresToEmit[i].second, 0));
				4418	if (!OutChains.empty())
				4419	Chain = DAG.getNode(ISD::TokenFactor, MVT::Other,
				4420	&OutChains[0], OutChains.size());
				4421	DAG.setRoot(Chain);
				4422	}
				4423
				4424
				4425	void SelectionDAGLowering::visitMalloc(MallocInst &I) {
				4426	SDValue Src = getValue(I.getOperand(0));
				4427
				4428	MVT IntPtr = TLI.getPointerTy();
				4429
				4430	if (IntPtr.bitsLT(Src.getValueType()))
				4431	Src = DAG.getNode(ISD::TRUNCATE, IntPtr, Src);
				4432	else if (IntPtr.bitsGT(Src.getValueType()))
				4433	Src = DAG.getNode(ISD::ZERO_EXTEND, IntPtr, Src);
				4434
				4435	// Scale the source by the type size.
				4436	uint64_t ElementSize = TD->getABITypeSize(I.getType()->getElementType());
				4437	Src = DAG.getNode(ISD::MUL, Src.getValueType(),
				4438	Src, DAG.getIntPtrConstant(ElementSize));
				4439
				4440	TargetLowering::ArgListTy Args;
				4441	TargetLowering::ArgListEntry Entry;
				4442	Entry.Node = Src;
				4443	Entry.Ty = TLI.getTargetData()->getIntPtrType();
				4444	Args.push_back(Entry);
				4445
				4446	std::pair<SDValue,SDValue> Result =
				4447	TLI.LowerCallTo(getRoot(), I.getType(), false, false, false, CallingConv::C,
				4448	true, DAG.getExternalSymbol("malloc", IntPtr), Args, DAG);
				4449	setValue(&I, Result.first); // Pointers always fit in registers
				4450	DAG.setRoot(Result.second);
				4451	}
				4452
				4453	void SelectionDAGLowering::visitFree(FreeInst &I) {
				4454	TargetLowering::ArgListTy Args;
				4455	TargetLowering::ArgListEntry Entry;
				4456	Entry.Node = getValue(I.getOperand(0));
				4457	Entry.Ty = TLI.getTargetData()->getIntPtrType();
				4458	Args.push_back(Entry);
				4459	MVT IntPtr = TLI.getPointerTy();
				4460	std::pair<SDValue,SDValue> Result =
				4461	TLI.LowerCallTo(getRoot(), Type::VoidTy, false, false, false,
				4462	CallingConv::C, true,
				4463	DAG.getExternalSymbol("free", IntPtr), Args, DAG);
				4464	DAG.setRoot(Result.second);
				4465	}
				4466
				4467	void SelectionDAGLowering::visitVAStart(CallInst &I) {
				4468	DAG.setRoot(DAG.getNode(ISD::VASTART, MVT::Other, getRoot(),
				4469	getValue(I.getOperand(1)),
				4470	DAG.getSrcValue(I.getOperand(1))));
				4471	}
				4472
				4473	void SelectionDAGLowering::visitVAArg(VAArgInst &I) {
				4474	SDValue V = DAG.getVAArg(TLI.getValueType(I.getType()), getRoot(),
				4475	getValue(I.getOperand(0)),
				4476	DAG.getSrcValue(I.getOperand(0)));
				4477	setValue(&I, V);
				4478	DAG.setRoot(V.getValue(1));
				4479	}
				4480
				4481	void SelectionDAGLowering::visitVAEnd(CallInst &I) {
				4482	DAG.setRoot(DAG.getNode(ISD::VAEND, MVT::Other, getRoot(),
				4483	getValue(I.getOperand(1)),
				4484	DAG.getSrcValue(I.getOperand(1))));
				4485	}
				4486
				4487	void SelectionDAGLowering::visitVACopy(CallInst &I) {
				4488	DAG.setRoot(DAG.getNode(ISD::VACOPY, MVT::Other, getRoot(),
				4489	getValue(I.getOperand(1)),
				4490	getValue(I.getOperand(2)),
				4491	DAG.getSrcValue(I.getOperand(1)),
				4492	DAG.getSrcValue(I.getOperand(2))));
				4493	}
				4494
				4495	/// TargetLowering::LowerArguments - This is the default LowerArguments
				4496	/// implementation, which just inserts a FORMAL_ARGUMENTS node. FIXME: When all
				4497	/// targets are migrated to using FORMAL_ARGUMENTS, this hook should be
				4498	/// integrated into SDISel.
				4499	void TargetLowering::LowerArguments(Function &F, SelectionDAG &DAG,
				4500	SmallVectorImpl<SDValue> &ArgValues) {
				4501	// Add CC# and isVararg as operands to the FORMAL_ARGUMENTS node.
				4502	SmallVector<SDValue, 3+16> Ops;
				4503	Ops.push_back(DAG.getRoot());
				4504	Ops.push_back(DAG.getConstant(F.getCallingConv(), getPointerTy()));
				4505	Ops.push_back(DAG.getConstant(F.isVarArg(), getPointerTy()));
				4506
				4507	// Add one result value for each formal argument.
				4508	SmallVector<MVT, 16> RetVals;
				4509	unsigned j = 1;
				4510	for (Function::arg_iterator I = F.arg_begin(), E = F.arg_end();
				4511	I != E; ++I, ++j) {
				4512	SmallVector<MVT, 4> ValueVTs;
				4513	ComputeValueVTs(*this, I->getType(), ValueVTs);
				4514	for (unsigned Value = 0, NumValues = ValueVTs.size();
				4515	Value != NumValues; ++Value) {
				4516	MVT VT = ValueVTs[Value];
				4517	const Type *ArgTy = VT.getTypeForMVT();
				4518	ISD::ArgFlagsTy Flags;
				4519	unsigned OriginalAlignment =
				4520	getTargetData()->getABITypeAlignment(ArgTy);
				4521
				4522	if (F.paramHasAttr(j, ParamAttr::ZExt))
				4523	Flags.setZExt();
				4524	if (F.paramHasAttr(j, ParamAttr::SExt))
				4525	Flags.setSExt();
				4526	if (F.paramHasAttr(j, ParamAttr::InReg))
				4527	Flags.setInReg();
				4528	if (F.paramHasAttr(j, ParamAttr::StructRet))
				4529	Flags.setSRet();
				4530	if (F.paramHasAttr(j, ParamAttr::ByVal)) {
				4531	Flags.setByVal();
				4532	const PointerType *Ty = cast<PointerType>(I->getType());
				4533	const Type *ElementTy = Ty->getElementType();
				4534	unsigned FrameAlign = getByValTypeAlignment(ElementTy);
				4535	unsigned FrameSize = getTargetData()->getABITypeSize(ElementTy);
				4536	// For ByVal, alignment should be passed from FE. BE will guess if
				4537	// this info is not there but there are cases it cannot get right.
				4538	if (F.getParamAlignment(j))
				4539	FrameAlign = F.getParamAlignment(j);
				4540	Flags.setByValAlign(FrameAlign);
				4541	Flags.setByValSize(FrameSize);
				4542	}
				4543	if (F.paramHasAttr(j, ParamAttr::Nest))
				4544	Flags.setNest();
				4545	Flags.setOrigAlign(OriginalAlignment);
				4546
				4547	MVT RegisterVT = getRegisterType(VT);
				4548	unsigned NumRegs = getNumRegisters(VT);
				4549	for (unsigned i = 0; i != NumRegs; ++i) {
				4550	RetVals.push_back(RegisterVT);
				4551	ISD::ArgFlagsTy MyFlags = Flags;
				4552	if (NumRegs > 1 && i == 0)
				4553	MyFlags.setSplit();
				4554	// if it isn't first piece, alignment must be 1
				4555	else if (i > 0)
				4556	MyFlags.setOrigAlign(1);
				4557	Ops.push_back(DAG.getArgFlags(MyFlags));
				4558	}
				4559	}
				4560	}
				4561
				4562	RetVals.push_back(MVT::Other);
				4563
				4564	// Create the node.
				4565	SDNode *Result = DAG.getNode(ISD::FORMAL_ARGUMENTS,
				4566	DAG.getVTList(&RetVals[0], RetVals.size()),
				4567	&Ops[0], Ops.size()).getNode();
				4568
				4569	// Prelower FORMAL_ARGUMENTS. This isn't required for functionality, but
				4570	// allows exposing the loads that may be part of the argument access to the
				4571	// first DAGCombiner pass.
				4572	SDValue TmpRes = LowerOperation(SDValue(Result, 0), DAG);
				4573
				4574	// The number of results should match up, except that the lowered one may have
				4575	// an extra flag result.
				4576	assert((Result->getNumValues() == TmpRes.getNode()->getNumValues() \|\|
				4577	(Result->getNumValues()+1 == TmpRes.getNode()->getNumValues() &&
				4578	TmpRes.getValue(Result->getNumValues()).getValueType() == MVT::Flag))
				4579	&& "Lowering produced unexpected number of results!");
				4580
				4581	// The FORMAL_ARGUMENTS node itself is likely no longer needed.
				4582	if (Result != TmpRes.getNode() && Result->use_empty()) {
				4583	HandleSDNode Dummy(DAG.getRoot());
				4584	DAG.RemoveDeadNode(Result);
				4585	}
				4586
				4587	Result = TmpRes.getNode();
				4588
				4589	unsigned NumArgRegs = Result->getNumValues() - 1;
				4590	DAG.setRoot(SDValue(Result, NumArgRegs));
				4591
				4592	// Set up the return result vector.
				4593	unsigned i = 0;
				4594	unsigned Idx = 1;
				4595	for (Function::arg_iterator I = F.arg_begin(), E = F.arg_end(); I != E;
				4596	++I, ++Idx) {
				4597	SmallVector<MVT, 4> ValueVTs;
				4598	ComputeValueVTs(*this, I->getType(), ValueVTs);
				4599	for (unsigned Value = 0, NumValues = ValueVTs.size();
				4600	Value != NumValues; ++Value) {
				4601	MVT VT = ValueVTs[Value];
				4602	MVT PartVT = getRegisterType(VT);
				4603
				4604	unsigned NumParts = getNumRegisters(VT);
				4605	SmallVector<SDValue, 4> Parts(NumParts);
				4606	for (unsigned j = 0; j != NumParts; ++j)
				4607	Parts[j] = SDValue(Result, i++);
				4608
				4609	ISD::NodeType AssertOp = ISD::DELETED_NODE;
				4610	if (F.paramHasAttr(Idx, ParamAttr::SExt))
				4611	AssertOp = ISD::AssertSext;
				4612	else if (F.paramHasAttr(Idx, ParamAttr::ZExt))
				4613	AssertOp = ISD::AssertZext;
				4614
				4615	ArgValues.push_back(getCopyFromParts(DAG, &Parts[0], NumParts, PartVT, VT,
				4616	AssertOp));
				4617	}
				4618	}
				4619	assert(i == NumArgRegs && "Argument register count mismatch!");
				4620	}
				4621
				4622
				4623	/// TargetLowering::LowerCallTo - This is the default LowerCallTo
				4624	/// implementation, which just inserts an ISD::CALL node, which is later custom
				4625	/// lowered by the target to something concrete. FIXME: When all targets are
				4626	/// migrated to using ISD::CALL, this hook should be integrated into SDISel.
				4627	std::pair<SDValue, SDValue>
				4628	TargetLowering::LowerCallTo(SDValue Chain, const Type *RetTy,
				4629	bool RetSExt, bool RetZExt, bool isVarArg,
				4630	unsigned CallingConv, bool isTailCall,
				4631	SDValue Callee,
				4632	ArgListTy &Args, SelectionDAG &DAG) {
				4633	SmallVector<SDValue, 32> Ops;
				4634	Ops.push_back(Chain); // Op#0 - Chain
				4635	Ops.push_back(DAG.getConstant(CallingConv, getPointerTy())); // Op#1 - CC
				4636	Ops.push_back(DAG.getConstant(isVarArg, getPointerTy())); // Op#2 - VarArg
				4637	Ops.push_back(DAG.getConstant(isTailCall, getPointerTy())); // Op#3 - Tail
				4638	Ops.push_back(Callee);
				4639
				4640	// Handle all of the outgoing arguments.
				4641	for (unsigned i = 0, e = Args.size(); i != e; ++i) {
				4642	SmallVector<MVT, 4> ValueVTs;
				4643	ComputeValueVTs(*this, Args[i].Ty, ValueVTs);
				4644	for (unsigned Value = 0, NumValues = ValueVTs.size();
				4645	Value != NumValues; ++Value) {
				4646	MVT VT = ValueVTs[Value];
				4647	const Type *ArgTy = VT.getTypeForMVT();
				4648	SDValue Op = SDValue(Args[i].Node.getNode(), Args[i].Node.getResNo() + Value);
				4649	ISD::ArgFlagsTy Flags;
				4650	unsigned OriginalAlignment =
				4651	getTargetData()->getABITypeAlignment(ArgTy);
				4652
				4653	if (Args[i].isZExt)
				4654	Flags.setZExt();
				4655	if (Args[i].isSExt)
				4656	Flags.setSExt();
				4657	if (Args[i].isInReg)
				4658	Flags.setInReg();
				4659	if (Args[i].isSRet)
				4660	Flags.setSRet();
				4661	if (Args[i].isByVal) {
				4662	Flags.setByVal();
				4663	const PointerType *Ty = cast<PointerType>(Args[i].Ty);
				4664	const Type *ElementTy = Ty->getElementType();
				4665	unsigned FrameAlign = getByValTypeAlignment(ElementTy);
				4666	unsigned FrameSize = getTargetData()->getABITypeSize(ElementTy);
				4667	// For ByVal, alignment should come from FE. BE will guess if this
				4668	// info is not there but there are cases it cannot get right.
				4669	if (Args[i].Alignment)
				4670	FrameAlign = Args[i].Alignment;
				4671	Flags.setByValAlign(FrameAlign);
				4672	Flags.setByValSize(FrameSize);
				4673	}
				4674	if (Args[i].isNest)
				4675	Flags.setNest();
				4676	Flags.setOrigAlign(OriginalAlignment);
				4677
				4678	MVT PartVT = getRegisterType(VT);
				4679	unsigned NumParts = getNumRegisters(VT);
				4680	SmallVector<SDValue, 4> Parts(NumParts);
				4681	ISD::NodeType ExtendKind = ISD::ANY_EXTEND;
				4682
				4683	if (Args[i].isSExt)
				4684	ExtendKind = ISD::SIGN_EXTEND;
				4685	else if (Args[i].isZExt)
				4686	ExtendKind = ISD::ZERO_EXTEND;
				4687
				4688	getCopyToParts(DAG, Op, &Parts[0], NumParts, PartVT, ExtendKind);
				4689
				4690	for (unsigned i = 0; i != NumParts; ++i) {
				4691	// if it isn't first piece, alignment must be 1
				4692	ISD::ArgFlagsTy MyFlags = Flags;
				4693	if (NumParts > 1 && i == 0)
				4694	MyFlags.setSplit();
				4695	else if (i != 0)
				4696	MyFlags.setOrigAlign(1);
				4697
				4698	Ops.push_back(Parts[i]);
				4699	Ops.push_back(DAG.getArgFlags(MyFlags));
				4700	}
				4701	}
				4702	}
				4703
				4704	// Figure out the result value types. We start by making a list of
				4705	// the potentially illegal return value types.
				4706	SmallVector<MVT, 4> LoweredRetTys;
				4707	SmallVector<MVT, 4> RetTys;
				4708	ComputeValueVTs(*this, RetTy, RetTys);
				4709
				4710	// Then we translate that to a list of legal types.
				4711	for (unsigned I = 0, E = RetTys.size(); I != E; ++I) {
				4712	MVT VT = RetTys[I];
				4713	MVT RegisterVT = getRegisterType(VT);
				4714	unsigned NumRegs = getNumRegisters(VT);
				4715	for (unsigned i = 0; i != NumRegs; ++i)
				4716	LoweredRetTys.push_back(RegisterVT);
				4717	}
				4718
				4719	LoweredRetTys.push_back(MVT::Other); // Always has a chain.
				4720
				4721	// Create the CALL node.
				4722	SDValue Res = DAG.getNode(ISD::CALL,
				4723	DAG.getVTList(&LoweredRetTys[0],
				4724	LoweredRetTys.size()),
				4725	&Ops[0], Ops.size());
				4726	Chain = Res.getValue(LoweredRetTys.size() - 1);
				4727
				4728	// Gather up the call result into a single value.
				4729	if (RetTy != Type::VoidTy) {
				4730	ISD::NodeType AssertOp = ISD::DELETED_NODE;
				4731
				4732	if (RetSExt)
				4733	AssertOp = ISD::AssertSext;
				4734	else if (RetZExt)
				4735	AssertOp = ISD::AssertZext;
				4736
				4737	SmallVector<SDValue, 4> ReturnValues;
				4738	unsigned RegNo = 0;
				4739	for (unsigned I = 0, E = RetTys.size(); I != E; ++I) {
				4740	MVT VT = RetTys[I];
				4741	MVT RegisterVT = getRegisterType(VT);
				4742	unsigned NumRegs = getNumRegisters(VT);
				4743	unsigned RegNoEnd = NumRegs + RegNo;
				4744	SmallVector<SDValue, 4> Results;
				4745	for (; RegNo != RegNoEnd; ++RegNo)
				4746	Results.push_back(Res.getValue(RegNo));
				4747	SDValue ReturnValue =
				4748	getCopyFromParts(DAG, &Results[0], NumRegs, RegisterVT, VT,
				4749	AssertOp);
				4750	ReturnValues.push_back(ReturnValue);
				4751	}
				4752	Res = DAG.getMergeValues(DAG.getVTList(&RetTys[0], RetTys.size()),
				4753	&ReturnValues[0], ReturnValues.size());
				4754	}
				4755
				4756	return std::make_pair(Res, Chain);
				4757	}
				4758
				4759	SDValue TargetLowering::LowerOperation(SDValue Op, SelectionDAG &DAG) {
				4760	assert(0 && "LowerOperation not implemented for this target!");
				4761	abort();
				4762	return SDValue();
				4763	}
				4764
				4765
				4766	void SelectionDAGLowering::CopyValueToVirtualRegister(Value *V, unsigned Reg) {
				4767	SDValue Op = getValue(V);
				4768	assert((Op.getOpcode() != ISD::CopyFromReg \|\|
				4769	cast<RegisterSDNode>(Op.getOperand(1))->getReg() != Reg) &&
				4770	"Copy from a reg to the same reg!");
				4771	assert(!TargetRegisterInfo::isPhysicalRegister(Reg) && "Is a physreg");
				4772
				4773	RegsForValue RFV(TLI, Reg, V->getType());
				4774	SDValue Chain = DAG.getEntryNode();
				4775	RFV.getCopyToRegs(Op, DAG, Chain, 0);
				4776	PendingExports.push_back(Chain);
				4777	}
				4778
				4779	#include "llvm/CodeGen/SelectionDAGISel.h"
				4780
				4781	void SelectionDAGISel::
				4782	LowerArguments(BasicBlock *LLVMBB) {
				4783	// If this is the entry block, emit arguments.
				4784	Function &F = *LLVMBB->getParent();
				4785	SDValue OldRoot = SDL->DAG.getRoot();
				4786	SmallVector<SDValue, 16> Args;
				4787	TLI.LowerArguments(F, SDL->DAG, Args);
				4788
				4789	unsigned a = 0;
				4790	for (Function::arg_iterator AI = F.arg_begin(), E = F.arg_end();
				4791	AI != E; ++AI) {
				4792	SmallVector<MVT, 4> ValueVTs;
				4793	ComputeValueVTs(TLI, AI->getType(), ValueVTs);
				4794	unsigned NumValues = ValueVTs.size();
				4795	if (!AI->use_empty()) {
				4796	SDL->setValue(AI, SDL->DAG.getMergeValues(&Args[a], NumValues));
				4797	// If this argument is live outside of the entry block, insert a copy from
				4798	// whereever we got it to the vreg that other BB's will reference it as.
				4799	DenseMap<const Value*, unsigned>::iterator VMI=FuncInfo->ValueMap.find(AI);
				4800	if (VMI != FuncInfo->ValueMap.end()) {
				4801	SDL->CopyValueToVirtualRegister(AI, VMI->second);
				4802	}
				4803	}
				4804	a += NumValues;
				4805	}
				4806
				4807	// Finally, if the target has anything special to do, allow it to do so.
				4808	// FIXME: this should insert code into the DAG!
				4809	EmitFunctionEntryCode(F, SDL->DAG.getMachineFunction());
				4810	}
				4811
				4812	/// Handle PHI nodes in successor blocks. Emit code into the SelectionDAG to
				4813	/// ensure constants are generated when needed. Remember the virtual registers
				4814	/// that need to be added to the Machine PHI nodes as input. We cannot just
				4815	/// directly add them, because expansion might result in multiple MBB's for one
				4816	/// BB. As such, the start of the BB might correspond to a different MBB than
				4817	/// the end.
				4818	///
				4819	void
				4820	SelectionDAGISel::HandlePHINodesInSuccessorBlocks(BasicBlock *LLVMBB) {
				4821	TerminatorInst *TI = LLVMBB->getTerminator();
				4822
				4823	SmallPtrSet<MachineBasicBlock *, 4> SuccsHandled;
				4824
				4825	// Check successor nodes' PHI nodes that expect a constant to be available
				4826	// from this block.
				4827	for (unsigned succ = 0, e = TI->getNumSuccessors(); succ != e; ++succ) {
				4828	BasicBlock *SuccBB = TI->getSuccessor(succ);
				4829	if (!isa<PHINode>(SuccBB->begin())) continue;
				4830	MachineBasicBlock *SuccMBB = FuncInfo->MBBMap[SuccBB];
				4831
				4832	// If this terminator has multiple identical successors (common for
				4833	// switches), only handle each succ once.
				4834	if (!SuccsHandled.insert(SuccMBB)) continue;
				4835
				4836	MachineBasicBlock::iterator MBBI = SuccMBB->begin();
				4837	PHINode *PN;
				4838
				4839	// At this point we know that there is a 1-1 correspondence between LLVM PHI
				4840	// nodes and Machine PHI nodes, but the incoming operands have not been
				4841	// emitted yet.
				4842	for (BasicBlock::iterator I = SuccBB->begin();
				4843	(PN = dyn_cast<PHINode>(I)); ++I) {
				4844	// Ignore dead phi's.
				4845	if (PN->use_empty()) continue;
				4846
				4847	unsigned Reg;
				4848	Value *PHIOp = PN->getIncomingValueForBlock(LLVMBB);
				4849
				4850	if (Constant *C = dyn_cast<Constant>(PHIOp)) {
				4851	unsigned &RegOut = SDL->ConstantsOut[C];
				4852	if (RegOut == 0) {
				4853	RegOut = FuncInfo->CreateRegForValue(C);
				4854	SDL->CopyValueToVirtualRegister(C, RegOut);
				4855	}
				4856	Reg = RegOut;
				4857	} else {
				4858	Reg = FuncInfo->ValueMap[PHIOp];
				4859	if (Reg == 0) {
				4860	assert(isa<AllocaInst>(PHIOp) &&
				4861	FuncInfo->StaticAllocaMap.count(cast<AllocaInst>(PHIOp)) &&
				4862	"Didn't codegen value into a register!??");
				4863	Reg = FuncInfo->CreateRegForValue(PHIOp);
				4864	SDL->CopyValueToVirtualRegister(PHIOp, Reg);
				4865	}
				4866	}
				4867
				4868	// Remember that this register needs to added to the machine PHI node as
				4869	// the input for this MBB.
				4870	SmallVector<MVT, 4> ValueVTs;
				4871	ComputeValueVTs(TLI, PN->getType(), ValueVTs);
				4872	for (unsigned vti = 0, vte = ValueVTs.size(); vti != vte; ++vti) {
				4873	MVT VT = ValueVTs[vti];
				4874	unsigned NumRegisters = TLI.getNumRegisters(VT);
				4875	for (unsigned i = 0, e = NumRegisters; i != e; ++i)
				4876	SDL->PHINodesToUpdate.push_back(std::make_pair(MBBI++, Reg+i));
				4877	Reg += NumRegisters;
				4878	}
				4879	}
				4880	}
				4881	SDL->ConstantsOut.clear();
Dan Gohman	f0cbcd4	2008-09-03 16:12:24 +0000	[diff] [blame]	4882	}
				4883
Dan Gohman	3df24e6	2008-09-03 23:12:08 +0000	[diff] [blame]	4884	/// This is the Fast-ISel version of HandlePHINodesInSuccessorBlocks. It only
				4885	/// supports legal types, and it emits MachineInstrs directly instead of
				4886	/// creating SelectionDAG nodes.
				4887	///
				4888	bool
				4889	SelectionDAGISel::HandlePHINodesInSuccessorBlocksFast(BasicBlock *LLVMBB,
				4890	FastISel *F) {
				4891	TerminatorInst *TI = LLVMBB->getTerminator();
Dan Gohman	f0cbcd4	2008-09-03 16:12:24 +0000	[diff] [blame]	4892
Dan Gohman	3df24e6	2008-09-03 23:12:08 +0000	[diff] [blame]	4893	SmallPtrSet<MachineBasicBlock *, 4> SuccsHandled;
				4894	unsigned OrigNumPHINodesToUpdate = SDL->PHINodesToUpdate.size();
				4895
				4896	// Check successor nodes' PHI nodes that expect a constant to be available
				4897	// from this block.
				4898	for (unsigned succ = 0, e = TI->getNumSuccessors(); succ != e; ++succ) {
				4899	BasicBlock *SuccBB = TI->getSuccessor(succ);
				4900	if (!isa<PHINode>(SuccBB->begin())) continue;
				4901	MachineBasicBlock *SuccMBB = FuncInfo->MBBMap[SuccBB];
				4902
				4903	// If this terminator has multiple identical successors (common for
				4904	// switches), only handle each succ once.
				4905	if (!SuccsHandled.insert(SuccMBB)) continue;
				4906
				4907	MachineBasicBlock::iterator MBBI = SuccMBB->begin();
				4908	PHINode *PN;
				4909
				4910	// At this point we know that there is a 1-1 correspondence between LLVM PHI
				4911	// nodes and Machine PHI nodes, but the incoming operands have not been
				4912	// emitted yet.
				4913	for (BasicBlock::iterator I = SuccBB->begin();
				4914	(PN = dyn_cast<PHINode>(I)); ++I) {
				4915	// Ignore dead phi's.
				4916	if (PN->use_empty()) continue;
				4917
				4918	// Only handle legal types. Two interesting things to note here. First,
				4919	// by bailing out early, we may leave behind some dead instructions,
				4920	// since SelectionDAG's HandlePHINodesInSuccessorBlocks will insert its
				4921	// own moves. Second, this check is necessary becuase FastISel doesn't
				4922	// use CreateRegForValue to create registers, so it always creates
				4923	// exactly one register for each non-void instruction.
				4924	MVT VT = TLI.getValueType(PN->getType(), /AllowUnknown=/true);
				4925	if (VT == MVT::Other \|\| !TLI.isTypeLegal(VT)) {
				4926	SDL->PHINodesToUpdate.resize(OrigNumPHINodesToUpdate);
				4927	return false;
				4928	}
				4929
				4930	Value *PHIOp = PN->getIncomingValueForBlock(LLVMBB);
				4931
				4932	unsigned Reg = F->getRegForValue(PHIOp);
				4933	if (Reg == 0) {
				4934	SDL->PHINodesToUpdate.resize(OrigNumPHINodesToUpdate);
				4935	return false;
				4936	}
				4937	SDL->PHINodesToUpdate.push_back(std::make_pair(MBBI++, Reg));
				4938	}
				4939	}
				4940
				4941	return true;
				4942	}