Blame - lib/Transforms/InstCombine/InstCombineAddSub.cpp - platform/external/llvm

blob: 8604b57c7087476056be6f724c86d0ac1546f105 [file] [log] [blame]

Chris Lattner	53a19b7	2010-01-05 07:18:46 +0000	[diff] [blame]	1	//===- InstCombineAddSub.cpp ----------------------------------------------===//
				2	//
				3	// The LLVM Compiler Infrastructure
				4	//
				5	// This file is distributed under the University of Illinois Open Source
				6	// License. See LICENSE.TXT for details.
				7	//
				8	//===----------------------------------------------------------------------===//
				9	//
				10	// This file implements the visit functions for add, fadd, sub, and fsub.
				11	//
				12	//===----------------------------------------------------------------------===//
				13
				14	#include "InstCombine.h"
				15	#include "llvm/Analysis/InstructionSimplify.h"
				16	#include "llvm/Target/TargetData.h"
				17	#include "llvm/Support/GetElementPtrTypeIterator.h"
				18	#include "llvm/Support/PatternMatch.h"
				19	using namespace llvm;
				20	using namespace PatternMatch;
				21
				22	/// AddOne - Add one to a ConstantInt.
				23	static Constant AddOne(Constant C) {
				24	return ConstantExpr::getAdd(C, ConstantInt::get(C->getType(), 1));
				25	}
				26	/// SubOne - Subtract one from a ConstantInt.
				27	static Constant SubOne(ConstantInt C) {
				28	return ConstantInt::get(C->getContext(), C->getValue()-1);
				29	}
				30
				31
				32	// dyn_castFoldableMul - If this value is a multiply that can be folded into
				33	// other computations (because it has a constant operand), return the
				34	// non-constant operand of the multiply, and set CST to point to the multiplier.
				35	// Otherwise, return null.
				36	//
				37	static inline Value dyn_castFoldableMul(Value V, ConstantInt *&CST) {
				38	if (V->hasOneUse() && V->getType()->isInteger())
				39	if (Instruction *I = dyn_cast<Instruction>(V)) {
				40	if (I->getOpcode() == Instruction::Mul)
				41	if ((CST = dyn_cast<ConstantInt>(I->getOperand(1))))
				42	return I->getOperand(0);
				43	if (I->getOpcode() == Instruction::Shl)
				44	if ((CST = dyn_cast<ConstantInt>(I->getOperand(1)))) {
				45	// The multiplier is really 1 << CST.
				46	uint32_t BitWidth = cast<IntegerType>(V->getType())->getBitWidth();
				47	uint32_t CSTVal = CST->getLimitedValue(BitWidth);
				48	CST = ConstantInt::get(V->getType()->getContext(),
				49	APInt(BitWidth, 1).shl(CSTVal));
				50	return I->getOperand(0);
				51	}
				52	}
				53	return 0;
				54	}
				55
				56
				57	/// WillNotOverflowSignedAdd - Return true if we can prove that:
				58	/// (sext (add LHS, RHS)) === (add (sext LHS), (sext RHS))
				59	/// This basically requires proving that the add in the original type would not
				60	/// overflow to change the sign bit or have a carry out.
				61	bool InstCombiner::WillNotOverflowSignedAdd(Value LHS, Value RHS) {
				62	// There are different heuristics we can use for this. Here are some simple
				63	// ones.
				64
				65	// Add has the property that adding any two 2's complement numbers can only
				66	// have one carry bit which can change a sign. As such, if LHS and RHS each
				67	// have at least two sign bits, we know that the addition of the two values
				68	// will sign extend fine.
				69	if (ComputeNumSignBits(LHS) > 1 && ComputeNumSignBits(RHS) > 1)
				70	return true;
				71
				72
				73	// If one of the operands only has one non-zero bit, and if the other operand
				74	// has a known-zero bit in a more significant place than it (not including the
				75	// sign bit) the ripple may go up to and fill the zero, but won't change the
				76	// sign. For example, (X & ~4) + 1.
				77
				78	// TODO: Implement.
				79
				80	return false;
				81	}
				82
				83	Instruction *InstCombiner::visitAdd(BinaryOperator &I) {
				84	bool Changed = SimplifyCommutative(I);
				85	Value LHS = I.getOperand(0), RHS = I.getOperand(1);
				86
				87	if (Value *V = SimplifyAddInst(LHS, RHS, I.hasNoSignedWrap(),
				88	I.hasNoUnsignedWrap(), TD))
				89	return ReplaceInstUsesWith(I, V);
				90
				91
				92	if (Constant *RHSC = dyn_cast<Constant>(RHS)) {
				93	if (ConstantInt *CI = dyn_cast<ConstantInt>(RHSC)) {
				94	// X + (signbit) --> X ^ signbit
				95	const APInt& Val = CI->getValue();
				96	uint32_t BitWidth = Val.getBitWidth();
				97	if (Val == APInt::getSignBit(BitWidth))
				98	return BinaryOperator::CreateXor(LHS, RHS);
				99
				100	// See if SimplifyDemandedBits can simplify this. This handles stuff like
				101	// (X & 254)+1 -> (X&254)\|1
				102	if (SimplifyDemandedInstructionBits(I))
				103	return &I;
				104
				105	// zext(bool) + C -> bool ? C + 1 : C
				106	if (ZExtInst *ZI = dyn_cast<ZExtInst>(LHS))
				107	if (ZI->getSrcTy() == Type::getInt1Ty(I.getContext()))
				108	return SelectInst::Create(ZI->getOperand(0), AddOne(CI), CI);
				109	}
				110
				111	if (isa<PHINode>(LHS))
				112	if (Instruction *NV = FoldOpIntoPhi(I))
				113	return NV;
				114
				115	ConstantInt *XorRHS = 0;
				116	Value *XorLHS = 0;
				117	if (isa<ConstantInt>(RHSC) &&
				118	match(LHS, m_Xor(m_Value(XorLHS), m_ConstantInt(XorRHS)))) {
				119	uint32_t TySizeBits = I.getType()->getScalarSizeInBits();
				120	const APInt& RHSVal = cast<ConstantInt>(RHSC)->getValue();
				121
				122	uint32_t Size = TySizeBits / 2;
				123	APInt C0080Val(APInt(TySizeBits, 1ULL).shl(Size - 1));
				124	APInt CFF80Val(-C0080Val);
				125	do {
				126	if (TySizeBits > Size) {
				127	// If we have ADD(XOR(AND(X, 0xFF), 0x80), 0xF..F80), it's a sext.
				128	// If we have ADD(XOR(AND(X, 0xFF), 0xF..F80), 0x80), it's a sext.
				129	if ((RHSVal == CFF80Val && XorRHS->getValue() == C0080Val) \|\|
				130	(RHSVal == C0080Val && XorRHS->getValue() == CFF80Val)) {
				131	// This is a sign extend if the top bits are known zero.
				132	if (!MaskedValueIsZero(XorLHS,
				133	APInt::getHighBitsSet(TySizeBits, TySizeBits - Size)))
				134	Size = 0; // Not a sign ext, but can't be any others either.
				135	break;
				136	}
				137	}
				138	Size >>= 1;
				139	C0080Val = APIntOps::lshr(C0080Val, Size);
				140	CFF80Val = APIntOps::ashr(CFF80Val, Size);
				141	} while (Size >= 1);
				142
				143	// FIXME: This shouldn't be necessary. When the backends can handle types
				144	// with funny bit widths then this switch statement should be removed. It
				145	// is just here to get the size of the "middle" type back up to something
				146	// that the back ends can handle.
				147	const Type *MiddleType = 0;
				148	switch (Size) {
				149	default: break;
				150	case 32:
				151	case 16:
				152	case 8: MiddleType = IntegerType::get(I.getContext(), Size); break;
				153	}
				154	if (MiddleType) {
				155	Value *NewTrunc = Builder->CreateTrunc(XorLHS, MiddleType, "sext");
				156	return new SExtInst(NewTrunc, I.getType(), I.getName());
				157	}
				158	}
				159	}
				160
				161	if (I.getType() == Type::getInt1Ty(I.getContext()))
				162	return BinaryOperator::CreateXor(LHS, RHS);
				163
				164	if (I.getType()->isInteger()) {
				165	// X + X --> X << 1
				166	if (LHS == RHS)
				167	return BinaryOperator::CreateShl(LHS, ConstantInt::get(I.getType(), 1));
				168
				169	if (Instruction *RHSI = dyn_cast<Instruction>(RHS)) {
				170	if (RHSI->getOpcode() == Instruction::Sub)
				171	if (LHS == RHSI->getOperand(1)) // A + (B - A) --> B
				172	return ReplaceInstUsesWith(I, RHSI->getOperand(0));
				173	}
				174	if (Instruction *LHSI = dyn_cast<Instruction>(LHS)) {
				175	if (LHSI->getOpcode() == Instruction::Sub)
				176	if (RHS == LHSI->getOperand(1)) // (B - A) + A --> B
				177	return ReplaceInstUsesWith(I, LHSI->getOperand(0));
				178	}
				179	}
				180
				181	// -A + B --> B - A
				182	// -A + -B --> -(A + B)
				183	if (Value *LHSV = dyn_castNegVal(LHS)) {
				184	if (LHS->getType()->isIntOrIntVector()) {
				185	if (Value *RHSV = dyn_castNegVal(RHS)) {
				186	Value *NewAdd = Builder->CreateAdd(LHSV, RHSV, "sum");
				187	return BinaryOperator::CreateNeg(NewAdd);
				188	}
				189	}
				190
				191	return BinaryOperator::CreateSub(RHS, LHSV);
				192	}
				193
				194	// A + -B --> A - B
				195	if (!isa<Constant>(RHS))
				196	if (Value *V = dyn_castNegVal(RHS))
				197	return BinaryOperator::CreateSub(LHS, V);
				198
				199
				200	ConstantInt *C2;
				201	if (Value *X = dyn_castFoldableMul(LHS, C2)) {
				202	if (X == RHS) // XC + X --> X (C+1)
				203	return BinaryOperator::CreateMul(RHS, AddOne(C2));
				204
				205	// XC1 + XC2 --> X * (C1+C2)
				206	ConstantInt *C1;
				207	if (X == dyn_castFoldableMul(RHS, C1))
				208	return BinaryOperator::CreateMul(X, ConstantExpr::getAdd(C1, C2));
				209	}
				210
				211	// X + XC --> X (C+1)
				212	if (dyn_castFoldableMul(RHS, C2) == LHS)
				213	return BinaryOperator::CreateMul(LHS, AddOne(C2));
				214
				215	// X + ~X --> -1 since ~X = -X-1
				216	if (match(LHS, m_Not(m_Specific(RHS))) \|\|
				217	match(RHS, m_Not(m_Specific(LHS))))
				218	return ReplaceInstUsesWith(I, Constant::getAllOnesValue(I.getType()));
				219
				220	// A+B --> A\|B iff A and B have no bits set in common.
				221	if (const IntegerType *IT = dyn_cast<IntegerType>(I.getType())) {
				222	APInt Mask = APInt::getAllOnesValue(IT->getBitWidth());
				223	APInt LHSKnownOne(IT->getBitWidth(), 0);
				224	APInt LHSKnownZero(IT->getBitWidth(), 0);
				225	ComputeMaskedBits(LHS, Mask, LHSKnownZero, LHSKnownOne);
				226	if (LHSKnownZero != 0) {
				227	APInt RHSKnownOne(IT->getBitWidth(), 0);
				228	APInt RHSKnownZero(IT->getBitWidth(), 0);
				229	ComputeMaskedBits(RHS, Mask, RHSKnownZero, RHSKnownOne);
				230
				231	// No bits in common -> bitwise or.
				232	if ((LHSKnownZero\|RHSKnownZero).isAllOnesValue())
				233	return BinaryOperator::CreateOr(LHS, RHS);
				234	}
				235	}
				236
				237	// WX + YZ --> W * (X+Z) iff W == Y
				238	if (I.getType()->isIntOrIntVector()) {
				239	Value W, X, Y, Z;
				240	if (match(LHS, m_Mul(m_Value(W), m_Value(X))) &&
				241	match(RHS, m_Mul(m_Value(Y), m_Value(Z)))) {
				242	if (W != Y) {
				243	if (W == Z) {
				244	std::swap(Y, Z);
				245	} else if (Y == X) {
				246	std::swap(W, X);
				247	} else if (X == Z) {
				248	std::swap(Y, Z);
				249	std::swap(W, X);
				250	}
				251	}
				252
				253	if (W == Y) {
				254	Value *NewAdd = Builder->CreateAdd(X, Z, LHS->getName());
				255	return BinaryOperator::CreateMul(W, NewAdd);
				256	}
				257	}
				258	}
				259
				260	if (ConstantInt *CRHS = dyn_cast<ConstantInt>(RHS)) {
				261	Value *X = 0;
				262	if (match(LHS, m_Not(m_Value(X)))) // ~X + C --> (C-1) - X
				263	return BinaryOperator::CreateSub(SubOne(CRHS), X);
				264
				265	// (X & FF00) + xx00 -> (X+xx00) & FF00
				266	if (LHS->hasOneUse() &&
				267	match(LHS, m_And(m_Value(X), m_ConstantInt(C2)))) {
				268	Constant *Anded = ConstantExpr::getAnd(CRHS, C2);
				269	if (Anded == CRHS) {
				270	// See if all bits from the first bit set in the Add RHS up are included
				271	// in the mask. First, get the rightmost bit.
				272	const APInt &AddRHSV = CRHS->getValue();
				273
				274	// Form a mask of all bits from the lowest bit added through the top.
				275	APInt AddRHSHighBits(~((AddRHSV & -AddRHSV)-1));
				276
				277	// See if the and mask includes all of these bits.
				278	APInt AddRHSHighBitsAnd(AddRHSHighBits & C2->getValue());
				279
				280	if (AddRHSHighBits == AddRHSHighBitsAnd) {
				281	// Okay, the xform is safe. Insert the new add pronto.
				282	Value *NewAdd = Builder->CreateAdd(X, CRHS, LHS->getName());
				283	return BinaryOperator::CreateAnd(NewAdd, C2);
				284	}
				285	}
				286	}
				287
				288	// Try to fold constant add into select arguments.
				289	if (SelectInst *SI = dyn_cast<SelectInst>(LHS))
				290	if (Instruction *R = FoldOpIntoSelect(I, SI))
				291	return R;
				292	}
				293
				294	// add (select X 0 (sub n A)) A --> select X A n
				295	{
				296	SelectInst *SI = dyn_cast<SelectInst>(LHS);
				297	Value *A = RHS;
				298	if (!SI) {
				299	SI = dyn_cast<SelectInst>(RHS);
				300	A = LHS;
				301	}
				302	if (SI && SI->hasOneUse()) {
				303	Value *TV = SI->getTrueValue();
				304	Value *FV = SI->getFalseValue();
				305	Value *N;
				306
				307	// Can we fold the add into the argument of the select?
				308	// We check both true and false select arguments for a matching subtract.
				309	if (match(FV, m_Zero()) &&
				310	match(TV, m_Sub(m_Value(N), m_Specific(A))))
				311	// Fold the add into the true select value.
				312	return SelectInst::Create(SI->getCondition(), N, A);
				313	if (match(TV, m_Zero()) &&
				314	match(FV, m_Sub(m_Value(N), m_Specific(A))))
				315	// Fold the add into the false select value.
				316	return SelectInst::Create(SI->getCondition(), A, N);
				317	}
				318	}
				319
				320	// Check for (add (sext x), y), see if we can merge this into an
				321	// integer add followed by a sext.
				322	if (SExtInst *LHSConv = dyn_cast<SExtInst>(LHS)) {
				323	// (add (sext x), cst) --> (sext (add x, cst'))
				324	if (ConstantInt *RHSC = dyn_cast<ConstantInt>(RHS)) {
				325	Constant *CI =
				326	ConstantExpr::getTrunc(RHSC, LHSConv->getOperand(0)->getType());
				327	if (LHSConv->hasOneUse() &&
				328	ConstantExpr::getSExt(CI, I.getType()) == RHSC &&
				329	WillNotOverflowSignedAdd(LHSConv->getOperand(0), CI)) {
				330	// Insert the new, smaller add.
				331	Value *NewAdd = Builder->CreateNSWAdd(LHSConv->getOperand(0),
				332	CI, "addconv");
				333	return new SExtInst(NewAdd, I.getType());
				334	}
				335	}
				336
				337	// (add (sext x), (sext y)) --> (sext (add int x, y))
				338	if (SExtInst *RHSConv = dyn_cast<SExtInst>(RHS)) {
				339	// Only do this if x/y have the same type, if at last one of them has a
				340	// single use (so we don't increase the number of sexts), and if the
				341	// integer add will not overflow.
				342	if (LHSConv->getOperand(0)->getType()==RHSConv->getOperand(0)->getType()&&
				343	(LHSConv->hasOneUse() \|\| RHSConv->hasOneUse()) &&
				344	WillNotOverflowSignedAdd(LHSConv->getOperand(0),
				345	RHSConv->getOperand(0))) {
				346	// Insert the new integer add.
				347	Value *NewAdd = Builder->CreateNSWAdd(LHSConv->getOperand(0),
				348	RHSConv->getOperand(0), "addconv");
				349	return new SExtInst(NewAdd, I.getType());
				350	}
				351	}
				352	}
				353
				354	return Changed ? &I : 0;
				355	}
				356
				357	Instruction *InstCombiner::visitFAdd(BinaryOperator &I) {
				358	bool Changed = SimplifyCommutative(I);
				359	Value LHS = I.getOperand(0), RHS = I.getOperand(1);
				360
				361	if (Constant *RHSC = dyn_cast<Constant>(RHS)) {
				362	// X + 0 --> X
				363	if (ConstantFP *CFP = dyn_cast<ConstantFP>(RHSC)) {
				364	if (CFP->isExactlyValue(ConstantFP::getNegativeZero
				365	(I.getType())->getValueAPF()))
				366	return ReplaceInstUsesWith(I, LHS);
				367	}
				368
				369	if (isa<PHINode>(LHS))
				370	if (Instruction *NV = FoldOpIntoPhi(I))
				371	return NV;
				372	}
				373
				374	// -A + B --> B - A
				375	// -A + -B --> -(A + B)
				376	if (Value *LHSV = dyn_castFNegVal(LHS))
				377	return BinaryOperator::CreateFSub(RHS, LHSV);
				378
				379	// A + -B --> A - B
				380	if (!isa<Constant>(RHS))
				381	if (Value *V = dyn_castFNegVal(RHS))
				382	return BinaryOperator::CreateFSub(LHS, V);
				383
				384	// Check for X+0.0. Simplify it to X if we know X is not -0.0.
				385	if (ConstantFP *CFP = dyn_cast<ConstantFP>(RHS))
				386	if (CFP->getValueAPF().isPosZero() && CannotBeNegativeZero(LHS))
				387	return ReplaceInstUsesWith(I, LHS);
				388
				389	// Check for (add double (sitofp x), y), see if we can merge this into an
				390	// integer add followed by a promotion.
				391	if (SIToFPInst *LHSConv = dyn_cast<SIToFPInst>(LHS)) {
				392	// (add double (sitofp x), fpcst) --> (sitofp (add int x, intcst))
				393	// ... if the constant fits in the integer value. This is useful for things
				394	// like (double)(x & 1234) + 4.0 -> (double)((X & 1234)+4) which no longer
				395	// requires a constant pool load, and generally allows the add to be better
				396	// instcombined.
				397	if (ConstantFP *CFP = dyn_cast<ConstantFP>(RHS)) {
				398	Constant *CI =
				399	ConstantExpr::getFPToSI(CFP, LHSConv->getOperand(0)->getType());
				400	if (LHSConv->hasOneUse() &&
				401	ConstantExpr::getSIToFP(CI, I.getType()) == CFP &&
				402	WillNotOverflowSignedAdd(LHSConv->getOperand(0), CI)) {
				403	// Insert the new integer add.
				404	Value *NewAdd = Builder->CreateNSWAdd(LHSConv->getOperand(0),
				405	CI, "addconv");
				406	return new SIToFPInst(NewAdd, I.getType());
				407	}
				408	}
				409
				410	// (add double (sitofp x), (sitofp y)) --> (sitofp (add int x, y))
				411	if (SIToFPInst *RHSConv = dyn_cast<SIToFPInst>(RHS)) {
				412	// Only do this if x/y have the same type, if at last one of them has a
				413	// single use (so we don't increase the number of int->fp conversions),
				414	// and if the integer add will not overflow.
				415	if (LHSConv->getOperand(0)->getType()==RHSConv->getOperand(0)->getType()&&
				416	(LHSConv->hasOneUse() \|\| RHSConv->hasOneUse()) &&
				417	WillNotOverflowSignedAdd(LHSConv->getOperand(0),
				418	RHSConv->getOperand(0))) {
				419	// Insert the new integer add.
				420	Value *NewAdd = Builder->CreateNSWAdd(LHSConv->getOperand(0),
				421	RHSConv->getOperand(0),"addconv");
				422	return new SIToFPInst(NewAdd, I.getType());
				423	}
				424	}
				425	}
				426
				427	return Changed ? &I : 0;
				428	}
				429
				430
				431	/// EmitGEPOffset - Given a getelementptr instruction/constantexpr, emit the
				432	/// code necessary to compute the offset from the base pointer (without adding
				433	/// in the base pointer). Return the result as a signed integer of intptr size.
				434	Value InstCombiner::EmitGEPOffset(User GEP) {
				435	TargetData &TD = *getTargetData();
				436	gep_type_iterator GTI = gep_type_begin(GEP);
				437	const Type *IntPtrTy = TD.getIntPtrType(GEP->getContext());
				438	Value *Result = Constant::getNullValue(IntPtrTy);
				439
				440	// Build a mask for high order bits.
				441	unsigned IntPtrWidth = TD.getPointerSizeInBits();
				442	uint64_t PtrSizeMask = ~0ULL >> (64-IntPtrWidth);
				443
				444	for (User::op_iterator i = GEP->op_begin() + 1, e = GEP->op_end(); i != e;
				445	++i, ++GTI) {
				446	Value Op = i;
				447	uint64_t Size = TD.getTypeAllocSize(GTI.getIndexedType()) & PtrSizeMask;
				448	if (ConstantInt *OpC = dyn_cast<ConstantInt>(Op)) {
				449	if (OpC->isZero()) continue;
				450
				451	// Handle a struct index, which adds its field offset to the pointer.
				452	if (const StructType STy = dyn_cast<StructType>(GTI)) {
				453	Size = TD.getStructLayout(STy)->getElementOffset(OpC->getZExtValue());
				454
				455	Result = Builder->CreateAdd(Result,
				456	ConstantInt::get(IntPtrTy, Size),
				457	GEP->getName()+".offs");
				458	continue;
				459	}
				460
				461	Constant *Scale = ConstantInt::get(IntPtrTy, Size);
				462	Constant *OC =
				463	ConstantExpr::getIntegerCast(OpC, IntPtrTy, true /SExt/);
				464	Scale = ConstantExpr::getMul(OC, Scale);
				465	// Emit an add instruction.
				466	Result = Builder->CreateAdd(Result, Scale, GEP->getName()+".offs");
				467	continue;
				468	}
				469	// Convert to correct type.
				470	if (Op->getType() != IntPtrTy)
				471	Op = Builder->CreateIntCast(Op, IntPtrTy, true, Op->getName()+".c");
				472	if (Size != 1) {
				473	Constant *Scale = ConstantInt::get(IntPtrTy, Size);
				474	// We'll let instcombine(mul) convert this to a shl if possible.
				475	Op = Builder->CreateMul(Op, Scale, GEP->getName()+".idx");
				476	}
				477
				478	// Emit an add instruction.
				479	Result = Builder->CreateAdd(Op, Result, GEP->getName()+".offs");
				480	}
				481	return Result;
				482	}
				483
				484
				485
				486
				487	/// Optimize pointer differences into the same array into a size. Consider:
				488	/// &A[10] - &A[0]: we should compile this to "10". LHS/RHS are the pointer
				489	/// operands to the ptrtoint instructions for the LHS/RHS of the subtract.
				490	///
				491	Value InstCombiner::OptimizePointerDifference(Value LHS, Value *RHS,
				492	const Type *Ty) {
				493	assert(TD && "Must have target data info for this");
				494
				495	// If LHS is a gep based on RHS or RHS is a gep based on LHS, we can optimize
				496	// this.
				497	bool Swapped = false;
				498	GetElementPtrInst *GEP = 0;
				499	ConstantExpr *CstGEP = 0;
				500
				501	// TODO: Could also optimize &A[i] - &A[j] -> "i-j", and "&A.foo[i] - &A.foo".
				502	// For now we require one side to be the base pointer "A" or a constant
				503	// expression derived from it.
				504	if (GetElementPtrInst *LHSGEP = dyn_cast<GetElementPtrInst>(LHS)) {
				505	// (gep X, ...) - X
				506	if (LHSGEP->getOperand(0) == RHS) {
				507	GEP = LHSGEP;
				508	Swapped = false;
				509	} else if (ConstantExpr *CE = dyn_cast<ConstantExpr>(RHS)) {
				510	// (gep X, ...) - (ce_gep X, ...)
				511	if (CE->getOpcode() == Instruction::GetElementPtr &&
				512	LHSGEP->getOperand(0) == CE->getOperand(0)) {
				513	CstGEP = CE;
				514	GEP = LHSGEP;
				515	Swapped = false;
				516	}
				517	}
				518	}
				519
				520	if (GetElementPtrInst *RHSGEP = dyn_cast<GetElementPtrInst>(RHS)) {
				521	// X - (gep X, ...)
				522	if (RHSGEP->getOperand(0) == LHS) {
				523	GEP = RHSGEP;
				524	Swapped = true;
				525	} else if (ConstantExpr *CE = dyn_cast<ConstantExpr>(LHS)) {
				526	// (ce_gep X, ...) - (gep X, ...)
				527	if (CE->getOpcode() == Instruction::GetElementPtr &&
				528	RHSGEP->getOperand(0) == CE->getOperand(0)) {
				529	CstGEP = CE;
				530	GEP = RHSGEP;
				531	Swapped = true;
				532	}
				533	}
				534	}
				535
				536	if (GEP == 0)
				537	return 0;
				538
				539	// Emit the offset of the GEP and an intptr_t.
				540	Value *Result = EmitGEPOffset(GEP);
				541
				542	// If we had a constant expression GEP on the other side offsetting the
				543	// pointer, subtract it from the offset we have.
				544	if (CstGEP) {
				545	Value *CstOffset = EmitGEPOffset(CstGEP);
				546	Result = Builder->CreateSub(Result, CstOffset);
				547	}
				548
				549
				550	// If we have p - gep(p, ...) then we have to negate the result.
				551	if (Swapped)
				552	Result = Builder->CreateNeg(Result, "diff.neg");
				553
				554	return Builder->CreateIntCast(Result, Ty, true);
				555	}
				556
				557
				558	Instruction *InstCombiner::visitSub(BinaryOperator &I) {
				559	Value Op0 = I.getOperand(0), Op1 = I.getOperand(1);
				560
				561	if (Op0 == Op1) // sub X, X -> 0
				562	return ReplaceInstUsesWith(I, Constant::getNullValue(I.getType()));
				563
				564	// If this is a 'B = x-(-A)', change to B = x+A. This preserves NSW/NUW.
				565	if (Value *V = dyn_castNegVal(Op1)) {
				566	BinaryOperator *Res = BinaryOperator::CreateAdd(Op0, V);
				567	Res->setHasNoSignedWrap(I.hasNoSignedWrap());
				568	Res->setHasNoUnsignedWrap(I.hasNoUnsignedWrap());
				569	return Res;
				570	}
				571
				572	if (isa<UndefValue>(Op0))
				573	return ReplaceInstUsesWith(I, Op0); // undef - X -> undef
				574	if (isa<UndefValue>(Op1))
				575	return ReplaceInstUsesWith(I, Op1); // X - undef -> undef
				576	if (I.getType() == Type::getInt1Ty(I.getContext()))
				577	return BinaryOperator::CreateXor(Op0, Op1);
				578
				579	if (ConstantInt *C = dyn_cast<ConstantInt>(Op0)) {
				580	// Replace (-1 - A) with (~A).
				581	if (C->isAllOnesValue())
				582	return BinaryOperator::CreateNot(Op1);
				583
				584	// C - ~X == X + (1+C)
				585	Value *X = 0;
				586	if (match(Op1, m_Not(m_Value(X))))
				587	return BinaryOperator::CreateAdd(X, AddOne(C));
				588
				589	// -(X >>u 31) -> (X >>s 31)
				590	// -(X >>s 31) -> (X >>u 31)
				591	if (C->isZero()) {
				592	if (BinaryOperator *SI = dyn_cast<BinaryOperator>(Op1)) {
				593	if (SI->getOpcode() == Instruction::LShr) {
				594	if (ConstantInt *CU = dyn_cast<ConstantInt>(SI->getOperand(1))) {
				595	// Check to see if we are shifting out everything but the sign bit.
				596	if (CU->getLimitedValue(SI->getType()->getPrimitiveSizeInBits()) ==
				597	SI->getType()->getPrimitiveSizeInBits()-1) {
				598	// Ok, the transformation is safe. Insert AShr.
				599	return BinaryOperator::Create(Instruction::AShr,
				600	SI->getOperand(0), CU, SI->getName());
				601	}
				602	}
				603	} else if (SI->getOpcode() == Instruction::AShr) {
				604	if (ConstantInt *CU = dyn_cast<ConstantInt>(SI->getOperand(1))) {
				605	// Check to see if we are shifting out everything but the sign bit.
				606	if (CU->getLimitedValue(SI->getType()->getPrimitiveSizeInBits()) ==
				607	SI->getType()->getPrimitiveSizeInBits()-1) {
				608	// Ok, the transformation is safe. Insert LShr.
				609	return BinaryOperator::CreateLShr(
				610	SI->getOperand(0), CU, SI->getName());
				611	}
				612	}
				613	}
				614	}
				615	}
				616
				617	// Try to fold constant sub into select arguments.
				618	if (SelectInst *SI = dyn_cast<SelectInst>(Op1))
				619	if (Instruction *R = FoldOpIntoSelect(I, SI))
				620	return R;
				621
				622	// C - zext(bool) -> bool ? C - 1 : C
				623	if (ZExtInst *ZI = dyn_cast<ZExtInst>(Op1))
				624	if (ZI->getSrcTy() == Type::getInt1Ty(I.getContext()))
				625	return SelectInst::Create(ZI->getOperand(0), SubOne(C), C);
				626	}
				627
				628	if (BinaryOperator *Op1I = dyn_cast<BinaryOperator>(Op1)) {
				629	if (Op1I->getOpcode() == Instruction::Add) {
				630	if (Op1I->getOperand(0) == Op0) // X-(X+Y) == -Y
				631	return BinaryOperator::CreateNeg(Op1I->getOperand(1),
				632	I.getName());
				633	else if (Op1I->getOperand(1) == Op0) // X-(Y+X) == -Y
				634	return BinaryOperator::CreateNeg(Op1I->getOperand(0),
				635	I.getName());
				636	else if (ConstantInt *CI1 = dyn_cast<ConstantInt>(I.getOperand(0))) {
				637	if (ConstantInt *CI2 = dyn_cast<ConstantInt>(Op1I->getOperand(1)))
				638	// C1-(X+C2) --> (C1-C2)-X
				639	return BinaryOperator::CreateSub(
				640	ConstantExpr::getSub(CI1, CI2), Op1I->getOperand(0));
				641	}
				642	}
				643
				644	if (Op1I->hasOneUse()) {
				645	// Replace (x - (y - z)) with (x + (z - y)) if the (y - z) subexpression
				646	// is not used by anyone else...
				647	//
				648	if (Op1I->getOpcode() == Instruction::Sub) {
				649	// Swap the two operands of the subexpr...
				650	Value IIOp0 = Op1I->getOperand(0), IIOp1 = Op1I->getOperand(1);
				651	Op1I->setOperand(0, IIOp1);
				652	Op1I->setOperand(1, IIOp0);
				653
				654	// Create the new top level add instruction...
				655	return BinaryOperator::CreateAdd(Op0, Op1);
				656	}
				657
				658	// Replace (A - (A & B)) with (A & ~B) if this is the only use of (A&B)...
				659	//
				660	if (Op1I->getOpcode() == Instruction::And &&
				661	(Op1I->getOperand(0) == Op0 \|\| Op1I->getOperand(1) == Op0)) {
				662	Value *OtherOp = Op1I->getOperand(Op1I->getOperand(0) == Op0);
				663
				664	Value *NewNot = Builder->CreateNot(OtherOp, "B.not");
				665	return BinaryOperator::CreateAnd(Op0, NewNot);
				666	}
				667
				668	// 0 - (X sdiv C) -> (X sdiv -C)
				669	if (Op1I->getOpcode() == Instruction::SDiv)
				670	if (ConstantInt *CSI = dyn_cast<ConstantInt>(Op0))
				671	if (CSI->isZero())
				672	if (Constant *DivRHS = dyn_cast<Constant>(Op1I->getOperand(1)))
				673	return BinaryOperator::CreateSDiv(Op1I->getOperand(0),
				674	ConstantExpr::getNeg(DivRHS));
				675
				676	// X - XC --> X (1-C)
				677	ConstantInt *C2 = 0;
				678	if (dyn_castFoldableMul(Op1I, C2) == Op0) {
				679	Constant *CP1 =
				680	ConstantExpr::getSub(ConstantInt::get(I.getType(), 1),
				681	C2);
				682	return BinaryOperator::CreateMul(Op0, CP1);
				683	}
				684	}
				685	}
				686
				687	if (BinaryOperator *Op0I = dyn_cast<BinaryOperator>(Op0)) {
				688	if (Op0I->getOpcode() == Instruction::Add) {
				689	if (Op0I->getOperand(0) == Op1) // (Y+X)-Y == X
				690	return ReplaceInstUsesWith(I, Op0I->getOperand(1));
				691	else if (Op0I->getOperand(1) == Op1) // (X+Y)-Y == X
				692	return ReplaceInstUsesWith(I, Op0I->getOperand(0));
				693	} else if (Op0I->getOpcode() == Instruction::Sub) {
				694	if (Op0I->getOperand(0) == Op1) // (X-Y)-X == -Y
				695	return BinaryOperator::CreateNeg(Op0I->getOperand(1),
				696	I.getName());
				697	}
				698	}
				699
				700	ConstantInt *C1;
				701	if (Value *X = dyn_castFoldableMul(Op0, C1)) {
				702	if (X == Op1) // XC - X --> X (C-1)
				703	return BinaryOperator::CreateMul(Op1, SubOne(C1));
				704
				705	ConstantInt C2; // XC1 - XC2 -> X (C1-C2)
				706	if (X == dyn_castFoldableMul(Op1, C2))
				707	return BinaryOperator::CreateMul(X, ConstantExpr::getSub(C1, C2));
				708	}
				709
				710	// Optimize pointer differences into the same array into a size. Consider:
				711	// &A[10] - &A[0]: we should compile this to "10".
				712	if (TD) {
				713	Value LHSOp, RHSOp;
				714	if (match(Op0, m_PtrToInt(m_Value(LHSOp))) &&
				715	match(Op1, m_PtrToInt(m_Value(RHSOp))))
				716	if (Value *Res = OptimizePointerDifference(LHSOp, RHSOp, I.getType()))
				717	return ReplaceInstUsesWith(I, Res);
				718
				719	// trunc(p)-trunc(q) -> trunc(p-q)
				720	if (match(Op0, m_Trunc(m_PtrToInt(m_Value(LHSOp)))) &&
				721	match(Op1, m_Trunc(m_PtrToInt(m_Value(RHSOp)))))
				722	if (Value *Res = OptimizePointerDifference(LHSOp, RHSOp, I.getType()))
				723	return ReplaceInstUsesWith(I, Res);
				724	}
				725
				726	return 0;
				727	}
				728
				729	Instruction *InstCombiner::visitFSub(BinaryOperator &I) {
				730	Value Op0 = I.getOperand(0), Op1 = I.getOperand(1);
				731
				732	// If this is a 'B = x-(-A)', change to B = x+A...
				733	if (Value *V = dyn_castFNegVal(Op1))
				734	return BinaryOperator::CreateFAdd(Op0, V);
				735
				736	if (BinaryOperator *Op1I = dyn_cast<BinaryOperator>(Op1)) {
				737	if (Op1I->getOpcode() == Instruction::FAdd) {
				738	if (Op1I->getOperand(0) == Op0) // X-(X+Y) == -Y
				739	return BinaryOperator::CreateFNeg(Op1I->getOperand(1),
				740	I.getName());
				741	else if (Op1I->getOperand(1) == Op0) // X-(Y+X) == -Y
				742	return BinaryOperator::CreateFNeg(Op1I->getOperand(0),
				743	I.getName());
				744	}
				745	}
				746
				747	return 0;
				748	}