Blame - llvm/lib/Transforms/Scalar/TailRecursionElimination.cpp - toolchain/llvm-project

blob: 2bdb316dbcba9890ab3fd7f7afc0ad1806906f78 [file] [log] [blame]

Chris Lattner	2e9014c	2003-09-20 05:03:31 +0000	[diff] [blame]	1	//===- TailRecursionElimination.cpp - Eliminate Tail Calls ----------------===//
John Criswell	482202a	2003-10-20 19:43:21 +0000	[diff] [blame]	2	//
				3	// The LLVM Compiler Infrastructure
				4	//
				5	// This file was developed by the LLVM research group and is distributed under
				6	// the University of Illinois Open Source License. See LICENSE.TXT for details.
				7	//
				8	//===----------------------------------------------------------------------===//
Chris Lattner	2e9014c	2003-09-20 05:03:31 +0000	[diff] [blame]	9	//
Chris Lattner	a7b6f3a	2003-12-08 05:34:54 +0000	[diff] [blame]	10	// This file transforms calls of the current function (self recursion) followed
				11	// by a return instruction with a branch to the entry of the function, creating
				12	// a loop. This pass also implements the following extensions to the basic
				13	// algorithm:
Chris Lattner	2e9014c	2003-09-20 05:03:31 +0000	[diff] [blame]	14	//
Chris Lattner	a7b6f3a	2003-12-08 05:34:54 +0000	[diff] [blame]	15	// 1. Trivial instructions between the call and return do not prevent the
				16	// transformation from taking place, though currently the analysis cannot
				17	// support moving any really useful instructions (only dead ones).
Chris Lattner	198e620	2003-12-08 23:19:26 +0000	[diff] [blame]	18	// 2. This pass transforms functions that are prevented from being tail
				19	// recursive by an associative expression to use an accumulator variable,
				20	// thus compiling the typical naive factorial or 'fib' implementation into
				21	// efficient code.
Chris Lattner	2e9014c	2003-09-20 05:03:31 +0000	[diff] [blame]	22	//
Chris Lattner	a7b6f3a	2003-12-08 05:34:54 +0000	[diff] [blame]	23	// There are several improvements that could be made:
				24	//
				25	// 1. If the function has any alloca instructions, these instructions will be
				26	// moved out of the entry block of the function, causing them to be
				27	// evaluated each time through the tail recursion. Safely keeping allocas
				28	// in the entry block requires analysis to proves that the tail-called
				29	// function does not read or write the stack object.
Chris Lattner	2e9014c	2003-09-20 05:03:31 +0000	[diff] [blame]	30	// 2. Tail recursion is only performed if the call immediately preceeds the
Chris Lattner	a7b6f3a	2003-12-08 05:34:54 +0000	[diff] [blame]	31	// return instruction. It's possible that there could be a jump between
				32	// the call and the return.
Chris Lattner	2e9014c	2003-09-20 05:03:31 +0000	[diff] [blame]	33	// 3. TRE is only performed if the function returns void or if the return
				34	// returns the result returned by the call. It is possible, but unlikely,
				35	// that the return returns something else (like constant 0), and can still
				36	// be TRE'd. It can be TRE'd if ALL OTHER return instructions in the
				37	// function return the exact same value.
Chris Lattner	a7b6f3a	2003-12-08 05:34:54 +0000	[diff] [blame]	38	// 4. There can be intervening operations between the call and the return that
				39	// prevent the TRE from occurring. For example, there could be GEP's and
				40	// stores to memory that will not be read or written by the call. This
				41	// requires some substantial analysis (such as with DSA) to prove safe to
				42	// move ahead of the call, but doing so could allow many more TREs to be
				43	// performed, for example in TreeAdd/TreeAlloc from the treeadd benchmark.
Chris Lattner	2e9014c	2003-09-20 05:03:31 +0000	[diff] [blame]	44	//
				45	//===----------------------------------------------------------------------===//
				46
Chris Lattner	0016085	2003-09-20 05:14:13 +0000	[diff] [blame]	47	#include "llvm/Transforms/Scalar.h"
Chris Lattner	2e9014c	2003-09-20 05:03:31 +0000	[diff] [blame]	48	#include "llvm/DerivedTypes.h"
				49	#include "llvm/Function.h"
				50	#include "llvm/Instructions.h"
				51	#include "llvm/Pass.h"
Chris Lattner	198e620	2003-12-08 23:19:26 +0000	[diff] [blame]	52	#include "llvm/Support/CFG.h"
Chris Lattner	2e9014c	2003-09-20 05:03:31 +0000	[diff] [blame]	53	#include "Support/Statistic.h"
Chris Lattner	2af5172	2003-11-20 18:25:24 +0000	[diff] [blame]	54	using namespace llvm;
Brian Gaeke	960707c	2003-11-11 22:41:34 +0000	[diff] [blame]	55
Chris Lattner	2e9014c	2003-09-20 05:03:31 +0000	[diff] [blame]	56	namespace {
				57	Statistic<> NumEliminated("tailcallelim", "Number of tail calls removed");
Chris Lattner	198e620	2003-12-08 23:19:26 +0000	[diff] [blame]	58	Statistic<> NumAccumAdded("tailcallelim","Number of accumulators introduced");
Chris Lattner	2e9014c	2003-09-20 05:03:31 +0000	[diff] [blame]	59
				60	struct TailCallElim : public FunctionPass {
				61	virtual bool runOnFunction(Function &F);
Chris Lattner	a7b6f3a	2003-12-08 05:34:54 +0000	[diff] [blame]	62
				63	private:
				64	bool ProcessReturningBlock(ReturnInst RI, BasicBlock &OldEntry,
				65	std::vector<PHINode*> &ArgumentPHIs);
				66	bool CanMoveAboveCall(Instruction I, CallInst CI);
Chris Lattner	198e620	2003-12-08 23:19:26 +0000	[diff] [blame]	67	Value CanTransformAccumulatorRecursion(Instruction I, CallInst *CI);
Chris Lattner	2e9014c	2003-09-20 05:03:31 +0000	[diff] [blame]	68	};
				69	RegisterOpt<TailCallElim> X("tailcallelim", "Tail Call Elimination");
				70	}
				71
Brian Gaeke	960707c	2003-11-11 22:41:34 +0000	[diff] [blame]	72	// Public interface to the TailCallElimination pass
Chris Lattner	2af5172	2003-11-20 18:25:24 +0000	[diff] [blame]	73	FunctionPass *llvm::createTailCallEliminationPass() {
				74	return new TailCallElim();
				75	}
Chris Lattner	0016085	2003-09-20 05:14:13 +0000	[diff] [blame]	76
Chris Lattner	2e9014c	2003-09-20 05:03:31 +0000	[diff] [blame]	77
				78	bool TailCallElim::runOnFunction(Function &F) {
				79	// If this function is a varargs function, we won't be able to PHI the args
				80	// right, so don't even try to convert it...
				81	if (F.getFunctionType()->isVarArg()) return false;
				82
				83	BasicBlock *OldEntry = 0;
				84	std::vector<PHINode*> ArgumentPHIs;
				85	bool MadeChange = false;
				86
				87	// Loop over the function, looking for any returning blocks...
				88	for (Function::iterator BB = F.begin(), E = F.end(); BB != E; ++BB)
				89	if (ReturnInst *Ret = dyn_cast<ReturnInst>(BB->getTerminator()))
Chris Lattner	a7b6f3a	2003-12-08 05:34:54 +0000	[diff] [blame]	90	MadeChange \|= ProcessReturningBlock(Ret, OldEntry, ArgumentPHIs);
Chris Lattner	2e9014c	2003-09-20 05:03:31 +0000	[diff] [blame]	91
Chris Lattner	50663a1	2003-12-08 23:37:35 +0000	[diff] [blame]	92	// If we eliminated any tail recursions, it's possible that we inserted some
				93	// silly PHI nodes which just merge an initial value (the incoming operand)
				94	// with themselves. Check to see if we did and clean up our mess if so. This
				95	// occurs when a function passes an argument straight through to its tail
				96	// call.
				97	if (!ArgumentPHIs.empty()) {
				98	unsigned NumIncoming = ArgumentPHIs[0]->getNumIncomingValues();
				99	for (unsigned i = 0, e = ArgumentPHIs.size(); i != e; ++i) {
				100	PHINode *PN = ArgumentPHIs[i];
				101	Value *V = 0;
				102	for (unsigned op = 0, e = NumIncoming; op != e; ++op) {
				103	Value *Op = PN->getIncomingValue(op);
				104	if (Op != PN) {
				105	if (V == 0) {
				106	V = Op; // First value seen?
				107	} else if (V != Op) {
				108	V = 0;
				109	break;
				110	}
				111	}
				112	}
				113
				114	// If the PHI Node is a dynamic constant, replace it with the value it is.
				115	if (V) {
				116	PN->replaceAllUsesWith(V);
				117	PN->getParent()->getInstList().erase(PN);
				118	}
				119	}
				120	}
				121
Chris Lattner	2e9014c	2003-09-20 05:03:31 +0000	[diff] [blame]	122	return MadeChange;
				123	}
Chris Lattner	a7b6f3a	2003-12-08 05:34:54 +0000	[diff] [blame]	124
				125
Chris Lattner	198e620	2003-12-08 23:19:26 +0000	[diff] [blame]	126	/// CanMoveAboveCall - Return true if it is safe to move the specified
				127	/// instruction from after the call to before the call, assuming that all
				128	/// instructions between the call and this instruction are movable.
				129	///
Chris Lattner	a7b6f3a	2003-12-08 05:34:54 +0000	[diff] [blame]	130	bool TailCallElim::CanMoveAboveCall(Instruction I, CallInst CI) {
				131	// FIXME: We can move load/store/call/free instructions above the call if the
				132	// call does not mod/ref the memory location being processed.
				133	if (I->mayWriteToMemory() \|\| isa<LoadInst>(I))
				134	return false;
				135
				136	// Otherwise, if this is a side-effect free instruction, check to make sure
				137	// that it does not use the return value of the call. If it doesn't use the
				138	// return value of the call, it must only use things that are defined before
				139	// the call, or movable instructions between the call and the instruction
				140	// itself.
				141	for (unsigned i = 0, e = I->getNumOperands(); i != e; ++i)
				142	if (I->getOperand(i) == CI)
				143	return false;
				144	return true;
				145	}
				146
				147
Chris Lattner	198e620	2003-12-08 23:19:26 +0000	[diff] [blame]	148	/// CanTransformAccumulatorRecursion - If the specified instruction can be
				149	/// transformed using accumulator recursion elimination, return the constant
				150	/// which is the start of the accumulator value. Otherwise return null.
				151	///
				152	Value TailCallElim::CanTransformAccumulatorRecursion(Instruction I,
				153	CallInst *CI) {
				154	if (!I->isAssociative()) return 0;
				155	assert(I->getNumOperands() == 2 &&
				156	"Associative operations should have 2 args!");
				157
				158	// Exactly one operand should be the result of the call instruction...
				159	if (I->getOperand(0) == CI && I->getOperand(1) == CI \|\|
				160	I->getOperand(0) != CI && I->getOperand(1) != CI)
				161	return 0;
				162
				163	// The only user of this instruction we allow is a single return instruction.
				164	if (!I->hasOneUse() \|\| !isa<ReturnInst>(I->use_back()))
				165	return 0;
				166
				167	// Ok, now we have to check all of the other return instructions in this
				168	// function. If they return non-constants or differing values, then we cannot
				169	// transform the function safely.
				170	Value *ReturnedValue = 0;
				171	Function *F = CI->getParent()->getParent();
				172
				173	for (Function::iterator BBI = F->begin(), E = F->end(); BBI != E; ++BBI)
				174	if (ReturnInst *RI = dyn_cast<ReturnInst>(BBI->getTerminator())) {
				175	Value *RetOp = RI->getOperand(0);
Chris Lattner	50663a1	2003-12-08 23:37:35 +0000	[diff] [blame]	176	if (RetOp != I) { // Ignore the one returning I.
				177	// We can only perform this transformation if the value returned is
				178	// evaluatable at the start of the initial invocation of the function,
				179	// instead of at the end of the evaluation.
				180	//
				181	// We currently handle static constants and arguments that are not
				182	// modified as part of the recursion.
				183	if (!isa<Constant>(RetOp)) { // Constants are always ok
				184	// Check to see if this is an immutable argument, if so, the value
				185	// will be available to initialize the accumulator.
				186	if (Argument *Arg = dyn_cast<Argument>(RetOp)) {
				187	// Figure out which argument number this is...
				188	unsigned ArgNo = 0;
				189	for (Function::aiterator AI = F->abegin(); &*AI != Arg; ++AI)
				190	++ArgNo;
				191
				192	// If we are passing this argument into call as the corresponding
				193	// argument operand, then the argument is dynamically constant.
				194	// Otherwise, we cannot transform this function safely.
				195	if (CI->getOperand(ArgNo+1) != Arg)
				196	return 0;
Chris Lattner	198e620	2003-12-08 23:19:26 +0000	[diff] [blame]	197
Chris Lattner	50663a1	2003-12-08 23:37:35 +0000	[diff] [blame]	198	} else {
				199	// Not a constant or immutable argument, we can't safely transform.
				200	return 0;
				201	}
				202	}
				203
				204	if (ReturnedValue && RetOp != ReturnedValue)
				205	return 0; // Cannot transform if differing values are returned.
				206	ReturnedValue = RetOp;
Chris Lattner	198e620	2003-12-08 23:19:26 +0000	[diff] [blame]	207	}
				208	}
Chris Lattner	50663a1	2003-12-08 23:37:35 +0000	[diff] [blame]	209
Chris Lattner	198e620	2003-12-08 23:19:26 +0000	[diff] [blame]	210	// Ok, if we passed this battery of tests, we can perform accumulator
				211	// recursion elimination.
				212	return ReturnedValue;
				213	}
				214
Chris Lattner	a7b6f3a	2003-12-08 05:34:54 +0000	[diff] [blame]	215	bool TailCallElim::ProcessReturningBlock(ReturnInst Ret, BasicBlock &OldEntry,
				216	std::vector<PHINode*> &ArgumentPHIs) {
				217	BasicBlock *BB = Ret->getParent();
				218	Function *F = BB->getParent();
				219
				220	if (&BB->front() == Ret) // Make sure there is something before the ret...
				221	return false;
				222
				223	// Scan backwards from the return, checking to see if there is a tail call in
				224	// this block. If so, set CI to it.
				225	CallInst *CI;
				226	BasicBlock::iterator BBI = Ret;
				227	while (1) {
				228	CI = dyn_cast<CallInst>(BBI);
				229	if (CI && CI->getCalledFunction() == F)
				230	break;
				231
				232	if (BBI == BB->begin())
				233	return false; // Didn't find a potential tail call.
				234	--BBI;
				235	}
				236
Chris Lattner	198e620	2003-12-08 23:19:26 +0000	[diff] [blame]	237	// If we are introducing accumulator recursion to eliminate associative
				238	// operations after the call instruction, this variable contains the initial
				239	// value for the accumulator. If this value is set, we actually perform
				240	// accumulator recursion elimination instead of simple tail recursion
				241	// elimination.
				242	Value *AccumulatorRecursionEliminationInitVal = 0;
				243	Instruction *AccumulatorRecursionInstr = 0;
				244
Chris Lattner	a7b6f3a	2003-12-08 05:34:54 +0000	[diff] [blame]	245	// Ok, we found a potential tail call. We can currently only transform the
				246	// tail call if all of the instructions between the call and the return are
				247	// movable to above the call itself, leaving the call next to the return.
				248	// Check that this is the case now.
				249	for (BBI = CI, ++BBI; &*BBI != Ret; ++BBI)
Chris Lattner	198e620	2003-12-08 23:19:26 +0000	[diff] [blame]	250	if (!CanMoveAboveCall(BBI, CI)) {
				251	// If we can't move the instruction above the call, it might be because it
				252	// is an associative operation that could be tranformed using accumulator
				253	// recursion elimination. Check to see if this is the case, and if so,
				254	// remember the initial accumulator value for later.
				255	if ((AccumulatorRecursionEliminationInitVal =
				256	CanTransformAccumulatorRecursion(BBI, CI))) {
				257	// Yes, this is accumulator recursion. Remember which instruction
				258	// accumulates.
				259	AccumulatorRecursionInstr = BBI;
				260	} else {
				261	return false; // Otherwise, we cannot eliminate the tail recursion!
				262	}
				263	}
Chris Lattner	a7b6f3a	2003-12-08 05:34:54 +0000	[diff] [blame]	264
				265	// We can only transform call/return pairs that either ignore the return value
				266	// of the call and return void, or return the value returned by the tail call.
Chris Lattner	198e620	2003-12-08 23:19:26 +0000	[diff] [blame]	267	if (Ret->getNumOperands() != 0 && Ret->getReturnValue() != CI &&
				268	AccumulatorRecursionEliminationInitVal == 0)
Chris Lattner	a7b6f3a	2003-12-08 05:34:54 +0000	[diff] [blame]	269	return false;
				270
				271	// OK! We can transform this tail call. If this is the first one found,
				272	// create the new entry block, allowing us to branch back to the old entry.
				273	if (OldEntry == 0) {
				274	OldEntry = &F->getEntryBlock();
				275	std::string OldName = OldEntry->getName(); OldEntry->setName("tailrecurse");
				276	BasicBlock *NewEntry = new BasicBlock(OldName, OldEntry);
				277	new BranchInst(OldEntry, NewEntry);
				278
				279	// Now that we have created a new block, which jumps to the entry
				280	// block, insert a PHI node for each argument of the function.
				281	// For now, we initialize each PHI to only have the real arguments
				282	// which are passed in.
				283	Instruction *InsertPos = OldEntry->begin();
				284	for (Function::aiterator I = F->abegin(), E = F->aend(); I != E; ++I) {
				285	PHINode *PN = new PHINode(I->getType(), I->getName()+".tr", InsertPos);
				286	I->replaceAllUsesWith(PN); // Everyone use the PHI node now!
				287	PN->addIncoming(I, NewEntry);
				288	ArgumentPHIs.push_back(PN);
				289	}
				290	}
				291
				292	// Ok, now that we know we have a pseudo-entry block WITH all of the
				293	// required PHI nodes, add entries into the PHI node for the actual
				294	// parameters passed into the tail-recursive call.
				295	for (unsigned i = 0, e = CI->getNumOperands()-1; i != e; ++i)
				296	ArgumentPHIs[i]->addIncoming(CI->getOperand(i+1), BB);
				297
Chris Lattner	198e620	2003-12-08 23:19:26 +0000	[diff] [blame]	298	// If we are introducing an accumulator variable to eliminate the recursion,
				299	// do so now. Note that we _know_ that no subsequent tail recursion
				300	// eliminations will happen on this function because of the way the
				301	// accumulator recursion predicate is set up.
				302	//
				303	if (AccumulatorRecursionEliminationInitVal) {
				304	Instruction *AccRecInstr = AccumulatorRecursionInstr;
				305	// Start by inserting a new PHI node for the accumulator.
				306	PHINode *AccPN = new PHINode(AccRecInstr->getType(), "accumulator.tr",
				307	OldEntry->begin());
				308
				309	// Loop over all of the predecessors of the tail recursion block. For the
				310	// real entry into the function we seed the PHI with the initial value,
				311	// computed earlier. For any other existing branches to this block (due to
				312	// other tail recursions eliminated) the accumulator is not modified.
				313	// Because we haven't added the branch in the current block to OldEntry yet,
				314	// it will not show up as a predecessor.
				315	for (pred_iterator PI = pred_begin(OldEntry), PE = pred_end(OldEntry);
				316	PI != PE; ++PI) {
				317	if (*PI == &F->getEntryBlock())
				318	AccPN->addIncoming(AccumulatorRecursionEliminationInitVal, *PI);
				319	else
				320	AccPN->addIncoming(AccPN, *PI);
				321	}
				322
				323	// Add an incoming argument for the current block, which is computed by our
				324	// associative accumulator instruction.
				325	AccPN->addIncoming(AccRecInstr, BB);
				326
				327	// Next, rewrite the accumulator recursion instruction so that it does not
				328	// use the result of the call anymore, instead, use the PHI node we just
				329	// inserted.
				330	AccRecInstr->setOperand(AccRecInstr->getOperand(0) != CI, AccPN);
				331
				332	// Finally, rewrite any return instructions in the program to return the PHI
				333	// node instead of the "initval" that they do currently. This loop will
				334	// actually rewrite the return value we are destroying, but that's ok.
				335	for (Function::iterator BBI = F->begin(), E = F->end(); BBI != E; ++BBI)
				336	if (ReturnInst *RI = dyn_cast<ReturnInst>(BBI->getTerminator()))
				337	RI->setOperand(0, AccPN);
				338	++NumAccumAdded;
				339	}
				340
Chris Lattner	a7b6f3a	2003-12-08 05:34:54 +0000	[diff] [blame]	341	// Now that all of the PHI nodes are in place, remove the call and
				342	// ret instructions, replacing them with an unconditional branch.
				343	new BranchInst(OldEntry, Ret);
				344	BB->getInstList().erase(Ret); // Remove return.
				345	BB->getInstList().erase(CI); // Remove call.
Chris Lattner	198e620	2003-12-08 23:19:26 +0000	[diff] [blame]	346	++NumEliminated;
Chris Lattner	a7b6f3a	2003-12-08 05:34:54 +0000	[diff] [blame]	347	return true;
				348	}