//===-- LoopUnroll.cpp - Loop unroller pass -------------------------------===//
//
//                     The LLVM Compiler Infrastructure
//
// This file is distributed under the University of Illinois Open Source
// License. See LICENSE.TXT for details.
//
//===----------------------------------------------------------------------===//
//
// This pass implements a simple loop unroller.  It works best when loops have
// been canonicalized by the -indvars pass, allowing it to determine the trip
// counts of loops easily.
//===----------------------------------------------------------------------===//
| 14 | |
| 15 | #define DEBUG_TYPE "loop-unroll" |
Dan Gohman | 45b3197 | 2008-05-14 00:24:14 +0000 | [diff] [blame] | 16 | #include "llvm/IntrinsicInst.h" |
Chris Lattner | 83bf288 | 2004-04-18 05:20:17 +0000 | [diff] [blame] | 17 | #include "llvm/Transforms/Scalar.h" |
Chris Lattner | 83bf288 | 2004-04-18 05:20:17 +0000 | [diff] [blame] | 18 | #include "llvm/Analysis/LoopInfo.h" |
Devang Patel | 3f1a1e0 | 2007-03-07 01:38:05 +0000 | [diff] [blame] | 19 | #include "llvm/Analysis/LoopPass.h" |
Reid Spencer | 9133fe2 | 2007-02-05 23:32:05 +0000 | [diff] [blame] | 20 | #include "llvm/Support/Compiler.h" |
Reid Spencer | 551ccae | 2004-09-01 22:55:40 +0000 | [diff] [blame] | 21 | #include "llvm/Support/CommandLine.h" |
| 22 | #include "llvm/Support/Debug.h" |
Daniel Dunbar | ce63ffb | 2009-07-25 00:23:56 +0000 | [diff] [blame] | 23 | #include "llvm/Support/raw_ostream.h" |
Dan Gohman | 45b3197 | 2008-05-14 00:24:14 +0000 | [diff] [blame] | 24 | #include "llvm/Transforms/Utils/UnrollLoop.h" |
Duncan Sands | 1a2d667 | 2008-05-16 09:30:00 +0000 | [diff] [blame] | 25 | #include <climits> |
Chris Lattner | 83bf288 | 2004-04-18 05:20:17 +0000 | [diff] [blame] | 26 | |
Dan Gohman | 45b3197 | 2008-05-14 00:24:14 +0000 | [diff] [blame] | 27 | using namespace llvm; |
Chris Lattner | 83bf288 | 2004-04-18 05:20:17 +0000 | [diff] [blame] | 28 | |
Dan Gohman | 844731a | 2008-05-13 00:00:25 +0000 | [diff] [blame] | 29 | static cl::opt<unsigned> |
| 30 | UnrollThreshold("unroll-threshold", cl::init(100), cl::Hidden, |
| 31 | cl::desc("The cut-off point for automatic loop unrolling")); |
| 32 | |
| 33 | static cl::opt<unsigned> |
| 34 | UnrollCount("unroll-count", cl::init(0), cl::Hidden, |
| 35 | cl::desc("Use this unroll count for all loops, for testing purposes")); |
| 36 | |
Matthijs Kooijman | 75cf9cc | 2008-07-29 13:21:23 +0000 | [diff] [blame] | 37 | static cl::opt<bool> |
| 38 | UnrollAllowPartial("unroll-allow-partial", cl::init(false), cl::Hidden, |
| 39 | cl::desc("Allows loops to be partially unrolled until " |
| 40 | "-unroll-threshold loop size is reached.")); |
| 41 | |
Chris Lattner | 0e5f499 | 2006-12-19 21:40:18 +0000 | [diff] [blame] | 42 | namespace { |
Devang Patel | 3f1a1e0 | 2007-03-07 01:38:05 +0000 | [diff] [blame] | 43 | class VISIBILITY_HIDDEN LoopUnroll : public LoopPass { |
Chris Lattner | 83bf288 | 2004-04-18 05:20:17 +0000 | [diff] [blame] | 44 | public: |
Devang Patel | 1997473 | 2007-05-03 01:11:54 +0000 | [diff] [blame] | 45 | static char ID; // Pass ID, replacement for typeid |
Dan Gohman | ae73dc1 | 2008-09-04 17:05:41 +0000 | [diff] [blame] | 46 | LoopUnroll() : LoopPass(&ID) {} |
Devang Patel | 794fd75 | 2007-05-01 21:15:47 +0000 | [diff] [blame] | 47 | |
Dan Gohman | c767844 | 2007-05-11 20:53:41 +0000 | [diff] [blame] | 48 | /// A magic value for use with the Threshold parameter to indicate |
| 49 | /// that the loop unroll should be performed regardless of how much |
| 50 | /// code expansion would result. |
| 51 | static const unsigned NoThreshold = UINT_MAX; |
| 52 | |
Devang Patel | 3f1a1e0 | 2007-03-07 01:38:05 +0000 | [diff] [blame] | 53 | bool runOnLoop(Loop *L, LPPassManager &LPM); |
Chris Lattner | 83bf288 | 2004-04-18 05:20:17 +0000 | [diff] [blame] | 54 | |
| 55 | /// This transformation requires natural loop information & requires that |
| 56 | /// loop preheaders be inserted into the CFG... |
| 57 | /// |
| 58 | virtual void getAnalysisUsage(AnalysisUsage &AU) const { |
Chris Lattner | 83bf288 | 2004-04-18 05:20:17 +0000 | [diff] [blame] | 59 | AU.addRequiredID(LoopSimplifyID); |
Owen Anderson | 3b53c4e | 2006-08-24 21:28:19 +0000 | [diff] [blame] | 60 | AU.addRequiredID(LCSSAID); |
Chris Lattner | 83bf288 | 2004-04-18 05:20:17 +0000 | [diff] [blame] | 61 | AU.addRequired<LoopInfo>(); |
Owen Anderson | 3b53c4e | 2006-08-24 21:28:19 +0000 | [diff] [blame] | 62 | AU.addPreservedID(LCSSAID); |
Chris Lattner | 9c2cc46 | 2004-04-18 05:38:37 +0000 | [diff] [blame] | 63 | AU.addPreserved<LoopInfo>(); |
Devang Patel | 98260a4 | 2008-07-03 07:04:22 +0000 | [diff] [blame] | 64 | // FIXME: Loop unroll requires LCSSA. And LCSSA requires dom info. |
| 65 | // If loop unroll does not preserve dom info then LCSSA pass on next |
| 66 | // loop will receive invalid dom info. |
| 67 | // For now, recreate dom info, if loop is unrolled. |
| 68 | AU.addPreserved<DominatorTree>(); |
| 69 | AU.addPreserved<DominanceFrontier>(); |
Chris Lattner | 83bf288 | 2004-04-18 05:20:17 +0000 | [diff] [blame] | 70 | } |
| 71 | }; |
Chris Lattner | 83bf288 | 2004-04-18 05:20:17 +0000 | [diff] [blame] | 72 | } |
| 73 | |
Dan Gohman | 844731a | 2008-05-13 00:00:25 +0000 | [diff] [blame] | 74 | char LoopUnroll::ID = 0; |
| 75 | static RegisterPass<LoopUnroll> X("loop-unroll", "Unroll loops"); |
| 76 | |
Daniel Dunbar | 394f044 | 2008-10-22 23:32:42 +0000 | [diff] [blame] | 77 | Pass *llvm::createLoopUnrollPass() { return new LoopUnroll(); } |
Chris Lattner | 83bf288 | 2004-04-18 05:20:17 +0000 | [diff] [blame] | 78 | |
Dan Gohman | f742c23 | 2007-05-08 15:14:19 +0000 | [diff] [blame] | 79 | /// ApproximateLoopSize - Approximate the size of the loop. |
Chris Lattner | 83bf288 | 2004-04-18 05:20:17 +0000 | [diff] [blame] | 80 | static unsigned ApproximateLoopSize(const Loop *L) { |
| 81 | unsigned Size = 0; |
Dan Gohman | 9b78763 | 2008-06-22 20:18:58 +0000 | [diff] [blame] | 82 | for (Loop::block_iterator I = L->block_begin(), E = L->block_end(); |
| 83 | I != E; ++I) { |
| 84 | BasicBlock *BB = *I; |
Chris Lattner | 83bf288 | 2004-04-18 05:20:17 +0000 | [diff] [blame] | 85 | Instruction *Term = BB->getTerminator(); |
| 86 | for (BasicBlock::iterator I = BB->begin(), E = BB->end(); I != E; ++I) { |
| 87 | if (isa<PHINode>(I) && BB == L->getHeader()) { |
| 88 | // Ignore PHI nodes in the header. |
| 89 | } else if (I->hasOneUse() && I->use_back() == Term) { |
| 90 | // Ignore instructions only used by the loop terminator. |
Reid Spencer | 3ed469c | 2006-11-02 20:25:50 +0000 | [diff] [blame] | 91 | } else if (isa<DbgInfoIntrinsic>(I)) { |
Jeff Cohen | 9d80930 | 2005-04-23 21:38:35 +0000 | [diff] [blame] | 92 | // Ignore debug instructions |
Dale Johannesen | 23300aa | 2009-04-20 22:19:33 +0000 | [diff] [blame] | 93 | } else if (isa<GetElementPtrInst>(I) && I->hasOneUse()) { |
| 94 | // Ignore GEP as they generally are subsumed into a load or store. |
Devang Patel | b176038 | 2008-03-17 23:41:20 +0000 | [diff] [blame] | 95 | } else if (isa<CallInst>(I)) { |
Devang Patel | ac3844d | 2008-03-19 23:05:52 +0000 | [diff] [blame] | 96 | // Estimate size overhead introduced by call instructions which |
| 97 | // is higher than other instructions. Here 3 and 10 are magic |
| 98 | // numbers that help one isolated test case from PR2067 without |
| 99 | // negatively impacting measured benchmarks. |
Devang Patel | b176038 | 2008-03-17 23:41:20 +0000 | [diff] [blame] | 100 | if (isa<IntrinsicInst>(I)) |
| 101 | Size = Size + 3; |
| 102 | else |
| 103 | Size = Size + 10; |
Chris Lattner | 83bf288 | 2004-04-18 05:20:17 +0000 | [diff] [blame] | 104 | } else { |
| 105 | ++Size; |
| 106 | } |
| 107 | |
| 108 | // TODO: Ignore expressions derived from PHI and constants if inval of phi |
| 109 | // is a constant, or if operation is associative. This will get induction |
| 110 | // variables. |
| 111 | } |
| 112 | } |
| 113 | |
| 114 | return Size; |
| 115 | } |
| 116 | |
Devang Patel | 3f1a1e0 | 2007-03-07 01:38:05 +0000 | [diff] [blame] | 117 | bool LoopUnroll::runOnLoop(Loop *L, LPPassManager &LPM) { |
Dan Gohman | c767844 | 2007-05-11 20:53:41 +0000 | [diff] [blame] | 118 | assert(L->isLCSSAForm()); |
Dan Gohman | 45b3197 | 2008-05-14 00:24:14 +0000 | [diff] [blame] | 119 | LoopInfo *LI = &getAnalysis<LoopInfo>(); |
Dan Gohman | c767844 | 2007-05-11 20:53:41 +0000 | [diff] [blame] | 120 | |
Dan Gohman | 1cc0096 | 2007-05-08 15:19:19 +0000 | [diff] [blame] | 121 | BasicBlock *Header = L->getHeader(); |
Daniel Dunbar | ce63ffb | 2009-07-25 00:23:56 +0000 | [diff] [blame] | 122 | DEBUG(errs() << "Loop Unroll: F[" << Header->getParent()->getName() |
| 123 | << "] Loop %" << Header->getName() << "\n"); |
Mike Stump | 02efa78 | 2009-07-27 23:14:11 +0000 | [diff] [blame] | 124 | (void)Header; |
Dan Gohman | c767844 | 2007-05-11 20:53:41 +0000 | [diff] [blame] | 125 | |
Dan Gohman | 45b3197 | 2008-05-14 00:24:14 +0000 | [diff] [blame] | 126 | // Find trip count |
| 127 | unsigned TripCount = L->getSmallConstantTripCount(); |
| 128 | unsigned Count = UnrollCount; |
Andreas Bolka | f1f2dc2 | 2009-08-13 02:40:50 +0000 | [diff] [blame] | 129 | |
Dan Gohman | c767844 | 2007-05-11 20:53:41 +0000 | [diff] [blame] | 130 | // Automatically select an unroll count. |
| 131 | if (Count == 0) { |
| 132 | // Conservative heuristic: if we know the trip count, see if we can |
| 133 | // completely unroll (subject to the threshold, checked below); otherwise |
Andreas Bolka | f1f2dc2 | 2009-08-13 02:40:50 +0000 | [diff] [blame] | 134 | // try to find greatest modulo of the trip count which is still under |
Matthijs Kooijman | 75cf9cc | 2008-07-29 13:21:23 +0000 | [diff] [blame] | 135 | // threshold value. |
Andreas Bolka | ec40eb4 | 2009-08-13 03:00:57 +0000 | [diff] [blame^] | 136 | if (TripCount == 0) |
Dan Gohman | c767844 | 2007-05-11 20:53:41 +0000 | [diff] [blame] | 137 | return false; |
Andreas Bolka | ec40eb4 | 2009-08-13 03:00:57 +0000 | [diff] [blame^] | 138 | Count = TripCount; |
Dan Gohman | c767844 | 2007-05-11 20:53:41 +0000 | [diff] [blame] | 139 | } |
| 140 | |
Dan Gohman | c767844 | 2007-05-11 20:53:41 +0000 | [diff] [blame] | 141 | // Enforce the threshold. |
Dan Gohman | 45b3197 | 2008-05-14 00:24:14 +0000 | [diff] [blame] | 142 | if (UnrollThreshold != NoThreshold) { |
Dan Gohman | c767844 | 2007-05-11 20:53:41 +0000 | [diff] [blame] | 143 | unsigned LoopSize = ApproximateLoopSize(L); |
Andreas Bolka | 52e539c | 2009-08-13 02:45:03 +0000 | [diff] [blame] | 144 | DEBUG(errs() << " Loop Size = " << LoopSize << "\n"); |
Dan Gohman | c767844 | 2007-05-11 20:53:41 +0000 | [diff] [blame] | 145 | uint64_t Size = (uint64_t)LoopSize*Count; |
Dan Gohman | 45b3197 | 2008-05-14 00:24:14 +0000 | [diff] [blame] | 146 | if (TripCount != 1 && Size > UnrollThreshold) { |
Andreas Bolka | 52e539c | 2009-08-13 02:45:03 +0000 | [diff] [blame] | 147 | DEBUG(errs() << " Too large to fully unroll with count: " << Count |
| 148 | << " because size: " << Size << ">" << UnrollThreshold << "\n"); |
Andreas Bolka | ec40eb4 | 2009-08-13 03:00:57 +0000 | [diff] [blame^] | 149 | if (!UnrollAllowPartial) { |
Andreas Bolka | 52e539c | 2009-08-13 02:45:03 +0000 | [diff] [blame] | 150 | DEBUG(errs() << " will not try to unroll partially because " |
| 151 | << "-unroll-allow-partial not given\n"); |
Matthijs Kooijman | 75cf9cc | 2008-07-29 13:21:23 +0000 | [diff] [blame] | 152 | return false; |
| 153 | } |
Andreas Bolka | ec40eb4 | 2009-08-13 03:00:57 +0000 | [diff] [blame^] | 154 | // Reduce unroll count to be modulo of TripCount for partial unrolling |
| 155 | Count = UnrollThreshold / LoopSize; |
| 156 | while (Count != 0 && TripCount%Count != 0) { |
| 157 | Count--; |
| 158 | } |
| 159 | if (Count < 2) { |
| 160 | DEBUG(errs() << " could not unroll partially\n"); |
| 161 | return false; |
| 162 | } |
| 163 | DEBUG(errs() << " partially unrolling with count: " << Count << "\n"); |
Dan Gohman | c767844 | 2007-05-11 20:53:41 +0000 | [diff] [blame] | 164 | } |
| 165 | } |
| 166 | |
Dan Gohman | 45b3197 | 2008-05-14 00:24:14 +0000 | [diff] [blame] | 167 | // Unroll the loop. |
Devang Patel | 98260a4 | 2008-07-03 07:04:22 +0000 | [diff] [blame] | 168 | Function *F = L->getHeader()->getParent(); |
Dan Gohman | 45b3197 | 2008-05-14 00:24:14 +0000 | [diff] [blame] | 169 | if (!UnrollLoop(L, Count, LI, &LPM)) |
| 170 | return false; |
Dan Gohman | c767844 | 2007-05-11 20:53:41 +0000 | [diff] [blame] | 171 | |
Devang Patel | 98260a4 | 2008-07-03 07:04:22 +0000 | [diff] [blame] | 172 | // FIXME: Reconstruct dom info, because it is not preserved properly. |
Duncan Sands | 1465d61 | 2009-01-28 13:14:17 +0000 | [diff] [blame] | 173 | DominatorTree *DT = getAnalysisIfAvailable<DominatorTree>(); |
Devang Patel | 98260a4 | 2008-07-03 07:04:22 +0000 | [diff] [blame] | 174 | if (DT) { |
| 175 | DT->runOnFunction(*F); |
Duncan Sands | 1465d61 | 2009-01-28 13:14:17 +0000 | [diff] [blame] | 176 | DominanceFrontier *DF = getAnalysisIfAvailable<DominanceFrontier>(); |
Devang Patel | 98260a4 | 2008-07-03 07:04:22 +0000 | [diff] [blame] | 177 | if (DF) |
| 178 | DF->runOnFunction(*F); |
| 179 | } |
Chris Lattner | 83bf288 | 2004-04-18 05:20:17 +0000 | [diff] [blame] | 180 | return true; |
| 181 | } |