Chris Lattner | 83bf288 | 2004-04-18 05:20:17 +0000 | [diff] [blame] | 1 | //===-- LoopUnroll.cpp - Loop unroller pass -------------------------------===// |
Misha Brukman | fd93908 | 2005-04-21 23:48:37 +0000 | [diff] [blame] | 2 | // |
Chris Lattner | 83bf288 | 2004-04-18 05:20:17 +0000 | [diff] [blame] | 3 | // The LLVM Compiler Infrastructure |
| 4 | // |
Chris Lattner | 4ee451d | 2007-12-29 20:36:04 +0000 | [diff] [blame] | 5 | // This file is distributed under the University of Illinois Open Source |
| 6 | // License. See LICENSE.TXT for details. |
Misha Brukman | fd93908 | 2005-04-21 23:48:37 +0000 | [diff] [blame] | 7 | // |
Chris Lattner | 83bf288 | 2004-04-18 05:20:17 +0000 | [diff] [blame] | 8 | //===----------------------------------------------------------------------===// |
| 9 | // |
| 10 | // This pass implements a simple loop unroller. It works best when loops have |
| 11 | // been canonicalized by the -indvars pass, allowing it to determine the trip |
| 12 | // counts of loops easily. |
Chris Lattner | 83bf288 | 2004-04-18 05:20:17 +0000 | [diff] [blame] | 13 | //===----------------------------------------------------------------------===// |
| 14 | |
| 15 | #define DEBUG_TYPE "loop-unroll" |
| 16 | #include "llvm/Transforms/Scalar.h" |
Chris Lattner | d9e0797 | 2011-01-02 07:35:53 +0000 | [diff] [blame] | 17 | #include "llvm/Analysis/CodeMetrics.h" |
Chandler Carruth | d04a8d4 | 2012-12-03 16:50:05 +0000 | [diff] [blame] | 18 | #include "llvm/Analysis/LoopPass.h" |
Dan Gohman | 052f000 | 2010-07-26 18:11:16 +0000 | [diff] [blame] | 19 | #include "llvm/Analysis/ScalarEvolution.h" |
Chandler Carruth | a5157e6 | 2013-01-21 13:04:33 +0000 | [diff] [blame] | 20 | #include "llvm/Analysis/TargetTransformInfo.h" |
Chandler Carruth | 0b8c9a8 | 2013-01-02 11:36:10 +0000 | [diff] [blame] | 21 | #include "llvm/IR/DataLayout.h" |
| 22 | #include "llvm/IR/IntrinsicInst.h" |
Reid Spencer | 551ccae | 2004-09-01 22:55:40 +0000 | [diff] [blame] | 23 | #include "llvm/Support/CommandLine.h" |
| 24 | #include "llvm/Support/Debug.h" |
Daniel Dunbar | ce63ffb | 2009-07-25 00:23:56 +0000 | [diff] [blame] | 25 | #include "llvm/Support/raw_ostream.h" |
Dan Gohman | 45b3197 | 2008-05-14 00:24:14 +0000 | [diff] [blame] | 26 | #include "llvm/Transforms/Utils/UnrollLoop.h" |
Duncan Sands | 1a2d667 | 2008-05-16 09:30:00 +0000 | [diff] [blame] | 27 | #include <climits> |
Chris Lattner | 83bf288 | 2004-04-18 05:20:17 +0000 | [diff] [blame] | 28 | |
Dan Gohman | 45b3197 | 2008-05-14 00:24:14 +0000 | [diff] [blame] | 29 | using namespace llvm; |
Chris Lattner | 83bf288 | 2004-04-18 05:20:17 +0000 | [diff] [blame] | 30 | |
Dan Gohman | 844731a | 2008-05-13 00:00:25 +0000 | [diff] [blame] | 31 | static cl::opt<unsigned> |
Owen Anderson | 8ea298a | 2010-09-10 17:57:00 +0000 | [diff] [blame] | 32 | UnrollThreshold("unroll-threshold", cl::init(150), cl::Hidden, |
Dan Gohman | 844731a | 2008-05-13 00:00:25 +0000 | [diff] [blame] | 33 | cl::desc("The cut-off point for automatic loop unrolling")); |
| 34 | |
| 35 | static cl::opt<unsigned> |
| 36 | UnrollCount("unroll-count", cl::init(0), cl::Hidden, |
| 37 | cl::desc("Use this unroll count for all loops, for testing purposes")); |
| 38 | |
Matthijs Kooijman | 75cf9cc | 2008-07-29 13:21:23 +0000 | [diff] [blame] | 39 | static cl::opt<bool> |
| 40 | UnrollAllowPartial("unroll-allow-partial", cl::init(false), cl::Hidden, |
| 41 | cl::desc("Allows loops to be partially unrolled until " |
| 42 | "-unroll-threshold loop size is reached.")); |
| 43 | |
Andrew Trick | 5d73448 | 2011-12-09 06:19:40 +0000 | [diff] [blame] | 44 | static cl::opt<bool> |
| 45 | UnrollRuntime("unroll-runtime", cl::ZeroOrMore, cl::init(false), cl::Hidden, |
| 46 | cl::desc("Unroll loops with run-time trip counts")); |
| 47 | |
Chris Lattner | 0e5f499 | 2006-12-19 21:40:18 +0000 | [diff] [blame] | 48 | namespace { |
Chris Lattner | 3e8b663 | 2009-09-02 06:11:42 +0000 | [diff] [blame] | 49 | class LoopUnroll : public LoopPass { |
Chris Lattner | 83bf288 | 2004-04-18 05:20:17 +0000 | [diff] [blame] | 50 | public: |
Devang Patel | 1997473 | 2007-05-03 01:11:54 +0000 | [diff] [blame] | 51 | static char ID; // Pass ID, replacement for typeid |
Junjie Gu | 32644d9 | 2011-04-13 16:15:29 +0000 | [diff] [blame] | 52 | LoopUnroll(int T = -1, int C = -1, int P = -1) : LoopPass(ID) { |
Chris Lattner | b3b1571 | 2011-04-14 02:27:25 +0000 | [diff] [blame] | 53 | CurrentThreshold = (T == -1) ? UnrollThreshold : unsigned(T); |
| 54 | CurrentCount = (C == -1) ? UnrollCount : unsigned(C); |
Junjie Gu | 32644d9 | 2011-04-13 16:15:29 +0000 | [diff] [blame] | 55 | CurrentAllowPartial = (P == -1) ? UnrollAllowPartial : (bool)P; |
| 56 | |
| 57 | UserThreshold = (T != -1) || (UnrollThreshold.getNumOccurrences() > 0); |
Hal Finkel | 4f7e2c3 | 2013-09-11 19:25:43 +0000 | [diff] [blame^] | 58 | UserAllowPartial = (P != -1) || |
| 59 | (UnrollAllowPartial.getNumOccurrences() > 0); |
| 60 | UserCount = (C != -1) || (UnrollCount.getNumOccurrences() > 0); |
Andrew Trick | ba03377 | 2011-07-23 00:29:16 +0000 | [diff] [blame] | 61 | |
Owen Anderson | 081c34b | 2010-10-19 17:21:58 +0000 | [diff] [blame] | 62 | initializeLoopUnrollPass(*PassRegistry::getPassRegistry()); |
| 63 | } |
Devang Patel | 794fd75 | 2007-05-01 21:15:47 +0000 | [diff] [blame] | 64 | |
Dan Gohman | c767844 | 2007-05-11 20:53:41 +0000 | [diff] [blame] | 65 | /// A magic value for use with the Threshold parameter to indicate |
| 66 | /// that the loop unroll should be performed regardless of how much |
| 67 | /// code expansion would result. |
| 68 | static const unsigned NoThreshold = UINT_MAX; |
Andrew Trick | ba03377 | 2011-07-23 00:29:16 +0000 | [diff] [blame] | 69 | |
Owen Anderson | e9f1882 | 2010-09-07 23:15:30 +0000 | [diff] [blame] | 70 | // Threshold to use when optsize is specified (and there is no |
| 71 | // explicit -unroll-threshold). |
| 72 | static const unsigned OptSizeUnrollThreshold = 50; |
Andrew Trick | ba03377 | 2011-07-23 00:29:16 +0000 | [diff] [blame] | 73 | |
Andrew Trick | 5d73448 | 2011-12-09 06:19:40 +0000 | [diff] [blame] | 74 | // Default unroll count for loops with run-time trip count if |
| 75 | // -unroll-count is not set |
| 76 | static const unsigned UnrollRuntimeCount = 8; |
| 77 | |
Junjie Gu | 32644d9 | 2011-04-13 16:15:29 +0000 | [diff] [blame] | 78 | unsigned CurrentCount; |
Owen Anderson | e9f1882 | 2010-09-07 23:15:30 +0000 | [diff] [blame] | 79 | unsigned CurrentThreshold; |
Junjie Gu | 32644d9 | 2011-04-13 16:15:29 +0000 | [diff] [blame] | 80 | bool CurrentAllowPartial; |
Hal Finkel | 4f7e2c3 | 2013-09-11 19:25:43 +0000 | [diff] [blame^] | 81 | bool UserCount; // CurrentCount is user-specified. |
Junjie Gu | 32644d9 | 2011-04-13 16:15:29 +0000 | [diff] [blame] | 82 | bool UserThreshold; // CurrentThreshold is user-specified. |
Hal Finkel | 4f7e2c3 | 2013-09-11 19:25:43 +0000 | [diff] [blame^] | 83 | bool UserAllowPartial; // CurrentAllowPartial is user-specified. |
Dan Gohman | c767844 | 2007-05-11 20:53:41 +0000 | [diff] [blame] | 84 | |
Devang Patel | 3f1a1e0 | 2007-03-07 01:38:05 +0000 | [diff] [blame] | 85 | bool runOnLoop(Loop *L, LPPassManager &LPM); |
Chris Lattner | 83bf288 | 2004-04-18 05:20:17 +0000 | [diff] [blame] | 86 | |
| 87 | /// This transformation requires natural loop information & requires that |
| 88 | /// loop preheaders be inserted into the CFG... |
| 89 | /// |
| 90 | virtual void getAnalysisUsage(AnalysisUsage &AU) const { |
Chris Lattner | 83bf288 | 2004-04-18 05:20:17 +0000 | [diff] [blame] | 91 | AU.addRequired<LoopInfo>(); |
Chris Lattner | 9c2cc46 | 2004-04-18 05:38:37 +0000 | [diff] [blame] | 92 | AU.addPreserved<LoopInfo>(); |
Dan Gohman | 052f000 | 2010-07-26 18:11:16 +0000 | [diff] [blame] | 93 | AU.addRequiredID(LoopSimplifyID); |
| 94 | AU.addPreservedID(LoopSimplifyID); |
| 95 | AU.addRequiredID(LCSSAID); |
| 96 | AU.addPreservedID(LCSSAID); |
Andrew Trick | 39f4029 | 2011-08-10 04:29:49 +0000 | [diff] [blame] | 97 | AU.addRequired<ScalarEvolution>(); |
Chris Lattner | 9377901 | 2010-08-29 17:21:35 +0000 | [diff] [blame] | 98 | AU.addPreserved<ScalarEvolution>(); |
Chandler Carruth | a5157e6 | 2013-01-21 13:04:33 +0000 | [diff] [blame] | 99 | AU.addRequired<TargetTransformInfo>(); |
Devang Patel | 98260a4 | 2008-07-03 07:04:22 +0000 | [diff] [blame] | 100 | // FIXME: Loop unroll requires LCSSA. And LCSSA requires dom info. |
| 101 | // If loop unroll does not preserve dom info then LCSSA pass on next |
| 102 | // loop will receive invalid dom info. |
| 103 | // For now, recreate dom info, if loop is unrolled. |
| 104 | AU.addPreserved<DominatorTree>(); |
Chris Lattner | 83bf288 | 2004-04-18 05:20:17 +0000 | [diff] [blame] | 105 | } |
| 106 | }; |
Chris Lattner | 83bf288 | 2004-04-18 05:20:17 +0000 | [diff] [blame] | 107 | } |
| 108 | |
Dan Gohman | 844731a | 2008-05-13 00:00:25 +0000 | [diff] [blame] | 109 | char LoopUnroll::ID = 0; |
Owen Anderson | 2ab36d3 | 2010-10-12 19:48:12 +0000 | [diff] [blame] | 110 | INITIALIZE_PASS_BEGIN(LoopUnroll, "loop-unroll", "Unroll loops", false, false) |
Chandler Carruth | a5157e6 | 2013-01-21 13:04:33 +0000 | [diff] [blame] | 111 | INITIALIZE_AG_DEPENDENCY(TargetTransformInfo) |
Owen Anderson | 2ab36d3 | 2010-10-12 19:48:12 +0000 | [diff] [blame] | 112 | INITIALIZE_PASS_DEPENDENCY(LoopInfo) |
| 113 | INITIALIZE_PASS_DEPENDENCY(LoopSimplify) |
| 114 | INITIALIZE_PASS_DEPENDENCY(LCSSA) |
Devang Patel | 9be72d4 | 2011-10-19 23:56:07 +0000 | [diff] [blame] | 115 | INITIALIZE_PASS_DEPENDENCY(ScalarEvolution) |
Owen Anderson | 2ab36d3 | 2010-10-12 19:48:12 +0000 | [diff] [blame] | 116 | INITIALIZE_PASS_END(LoopUnroll, "loop-unroll", "Unroll loops", false, false) |
Dan Gohman | 844731a | 2008-05-13 00:00:25 +0000 | [diff] [blame] | 117 | |
Junjie Gu | 32644d9 | 2011-04-13 16:15:29 +0000 | [diff] [blame] | 118 | Pass *llvm::createLoopUnrollPass(int Threshold, int Count, int AllowPartial) { |
Junjie Gu | 7133b85 | 2011-04-13 16:45:49 +0000 | [diff] [blame] | 119 | return new LoopUnroll(Threshold, Count, AllowPartial); |
Junjie Gu | 32644d9 | 2011-04-13 16:15:29 +0000 | [diff] [blame] | 120 | } |
Chris Lattner | 83bf288 | 2004-04-18 05:20:17 +0000 | [diff] [blame] | 121 | |
Dan Gohman | f742c23 | 2007-05-08 15:14:19 +0000 | [diff] [blame] | 122 | /// ApproximateLoopSize - Approximate the size of the loop. |
Andrew Trick | b2ab2fa | 2011-10-01 01:39:05 +0000 | [diff] [blame] | 123 | static unsigned ApproximateLoopSize(const Loop *L, unsigned &NumCalls, |
Chandler Carruth | a5157e6 | 2013-01-21 13:04:33 +0000 | [diff] [blame] | 124 | bool &NotDuplicatable, |
| 125 | const TargetTransformInfo &TTI) { |
Dan Gohman | a2aabe3 | 2009-10-31 14:54:17 +0000 | [diff] [blame] | 126 | CodeMetrics Metrics; |
Dan Gohman | 9b78763 | 2008-06-22 20:18:58 +0000 | [diff] [blame] | 127 | for (Loop::block_iterator I = L->block_begin(), E = L->block_end(); |
Dan Gohman | a2aabe3 | 2009-10-31 14:54:17 +0000 | [diff] [blame] | 128 | I != E; ++I) |
Chandler Carruth | a5157e6 | 2013-01-21 13:04:33 +0000 | [diff] [blame] | 129 | Metrics.analyzeBasicBlock(*I, TTI); |
Owen Anderson | f9a26b8 | 2010-09-09 20:32:23 +0000 | [diff] [blame] | 130 | NumCalls = Metrics.NumInlineCandidates; |
James Molloy | 67ae135 | 2012-12-20 16:04:27 +0000 | [diff] [blame] | 131 | NotDuplicatable = Metrics.notDuplicatable; |
Andrew Trick | ba03377 | 2011-07-23 00:29:16 +0000 | [diff] [blame] | 132 | |
Owen Anderson | 6add2fb | 2010-09-09 19:07:31 +0000 | [diff] [blame] | 133 | unsigned LoopSize = Metrics.NumInsts; |
Andrew Trick | ba03377 | 2011-07-23 00:29:16 +0000 | [diff] [blame] | 134 | |
Owen Anderson | 6add2fb | 2010-09-09 19:07:31 +0000 | [diff] [blame] | 135 | // Don't allow an estimate of size zero. This would allows unrolling of loops |
| 136 | // with huge iteration counts, which is a compile time problem even if it's |
| 137 | // not a problem for code quality. |
| 138 | if (LoopSize == 0) LoopSize = 1; |
Andrew Trick | ba03377 | 2011-07-23 00:29:16 +0000 | [diff] [blame] | 139 | |
Owen Anderson | 6add2fb | 2010-09-09 19:07:31 +0000 | [diff] [blame] | 140 | return LoopSize; |
Chris Lattner | 83bf288 | 2004-04-18 05:20:17 +0000 | [diff] [blame] | 141 | } |
| 142 | |
Devang Patel | 3f1a1e0 | 2007-03-07 01:38:05 +0000 | [diff] [blame] | 143 | bool LoopUnroll::runOnLoop(Loop *L, LPPassManager &LPM) { |
Dan Gohman | 45b3197 | 2008-05-14 00:24:14 +0000 | [diff] [blame] | 144 | LoopInfo *LI = &getAnalysis<LoopInfo>(); |
Andrew Trick | b1831c6 | 2011-08-11 23:36:16 +0000 | [diff] [blame] | 145 | ScalarEvolution *SE = &getAnalysis<ScalarEvolution>(); |
Chandler Carruth | a5157e6 | 2013-01-21 13:04:33 +0000 | [diff] [blame] | 146 | const TargetTransformInfo &TTI = getAnalysis<TargetTransformInfo>(); |
Dan Gohman | c767844 | 2007-05-11 20:53:41 +0000 | [diff] [blame] | 147 | |
Dan Gohman | 1cc0096 | 2007-05-08 15:19:19 +0000 | [diff] [blame] | 148 | BasicBlock *Header = L->getHeader(); |
David Greene | d241e38 | 2010-01-05 01:27:44 +0000 | [diff] [blame] | 149 | DEBUG(dbgs() << "Loop Unroll: F[" << Header->getParent()->getName() |
Daniel Dunbar | ce63ffb | 2009-07-25 00:23:56 +0000 | [diff] [blame] | 150 | << "] Loop %" << Header->getName() << "\n"); |
Mike Stump | 02efa78 | 2009-07-27 23:14:11 +0000 | [diff] [blame] | 151 | (void)Header; |
Andrew Trick | ba03377 | 2011-07-23 00:29:16 +0000 | [diff] [blame] | 152 | |
Hal Finkel | 4f7e2c3 | 2013-09-11 19:25:43 +0000 | [diff] [blame^] | 153 | TargetTransformInfo::UnrollingPreferences UP; |
| 154 | UP.Threshold = CurrentThreshold; |
| 155 | UP.OptSizeThreshold = OptSizeUnrollThreshold; |
| 156 | UP.Count = CurrentCount; |
| 157 | UP.Partial = CurrentAllowPartial; |
| 158 | UP.Runtime = UnrollRuntime; |
| 159 | TTI.getUnrollingPreferences(L, UP); |
| 160 | |
Owen Anderson | e9f1882 | 2010-09-07 23:15:30 +0000 | [diff] [blame] | 161 | // Determine the current unrolling threshold. While this is normally set |
| 162 | // from UnrollThreshold, it is overridden to a smaller value if the current |
| 163 | // function is marked as optimize-for-size, and the unroll threshold was |
| 164 | // not user specified. |
Hal Finkel | 4f7e2c3 | 2013-09-11 19:25:43 +0000 | [diff] [blame^] | 165 | unsigned Threshold = UserThreshold ? CurrentThreshold : UP.Threshold; |
Andrew Trick | ba03377 | 2011-07-23 00:29:16 +0000 | [diff] [blame] | 166 | if (!UserThreshold && |
Bill Wendling | 831737d | 2012-12-30 10:32:01 +0000 | [diff] [blame] | 167 | Header->getParent()->getAttributes(). |
| 168 | hasAttribute(AttributeSet::FunctionIndex, |
| 169 | Attribute::OptimizeForSize)) |
Hal Finkel | 4f7e2c3 | 2013-09-11 19:25:43 +0000 | [diff] [blame^] | 170 | Threshold = UP.OptSizeThreshold; |
Dan Gohman | c767844 | 2007-05-11 20:53:41 +0000 | [diff] [blame] | 171 | |
Andrew Trick | b1831c6 | 2011-08-11 23:36:16 +0000 | [diff] [blame] | 172 | // Find trip count and trip multiple if count is not available |
| 173 | unsigned TripCount = 0; |
Andrew Trick | 2045ce1 | 2011-07-23 00:33:05 +0000 | [diff] [blame] | 174 | unsigned TripMultiple = 1; |
Andrew Trick | ed38f1c | 2011-11-28 19:22:09 +0000 | [diff] [blame] | 175 | // Find "latch trip count". UnrollLoop assumes that control cannot exit |
| 176 | // via the loop latch on any iteration prior to TripCount. The loop may exit |
| 177 | // early via an earlier branch. |
| 178 | BasicBlock *LatchBlock = L->getLoopLatch(); |
| 179 | if (LatchBlock) { |
| 180 | TripCount = SE->getSmallConstantTripCount(L, LatchBlock); |
| 181 | TripMultiple = SE->getSmallConstantTripMultiple(L, LatchBlock); |
Andrew Trick | b1831c6 | 2011-08-11 23:36:16 +0000 | [diff] [blame] | 182 | } |
Hal Finkel | 4f7e2c3 | 2013-09-11 19:25:43 +0000 | [diff] [blame^] | 183 | |
| 184 | bool Runtime = UnrollRuntime.getNumOccurrences() == 0 ? |
| 185 | UP.Runtime : UnrollRuntime; |
| 186 | |
Andrew Trick | 5d73448 | 2011-12-09 06:19:40 +0000 | [diff] [blame] | 187 | // Use a default unroll-count if the user doesn't specify a value |
| 188 | // and the trip count is a run-time value. The default is different |
| 189 | // for run-time or compile-time trip count loops. |
Hal Finkel | 4f7e2c3 | 2013-09-11 19:25:43 +0000 | [diff] [blame^] | 190 | unsigned Count = UserCount ? CurrentCount : UP.Count; |
| 191 | if (Runtime && Count == 0 && TripCount == 0) |
Andrew Trick | 5d73448 | 2011-12-09 06:19:40 +0000 | [diff] [blame] | 192 | Count = UnrollRuntimeCount; |
| 193 | |
Dan Gohman | c767844 | 2007-05-11 20:53:41 +0000 | [diff] [blame] | 194 | if (Count == 0) { |
| 195 | // Conservative heuristic: if we know the trip count, see if we can |
| 196 | // completely unroll (subject to the threshold, checked below); otherwise |
Andreas Bolka | f1f2dc2 | 2009-08-13 02:40:50 +0000 | [diff] [blame] | 197 | // try to find greatest modulo of the trip count which is still under |
Matthijs Kooijman | 75cf9cc | 2008-07-29 13:21:23 +0000 | [diff] [blame] | 198 | // threshold value. |
Andreas Bolka | ec40eb4 | 2009-08-13 03:00:57 +0000 | [diff] [blame] | 199 | if (TripCount == 0) |
Dan Gohman | c767844 | 2007-05-11 20:53:41 +0000 | [diff] [blame] | 200 | return false; |
Andreas Bolka | ec40eb4 | 2009-08-13 03:00:57 +0000 | [diff] [blame] | 201 | Count = TripCount; |
Dan Gohman | c767844 | 2007-05-11 20:53:41 +0000 | [diff] [blame] | 202 | } |
| 203 | |
Dan Gohman | c767844 | 2007-05-11 20:53:41 +0000 | [diff] [blame] | 204 | // Enforce the threshold. |
Junjie Gu | 32644d9 | 2011-04-13 16:15:29 +0000 | [diff] [blame] | 205 | if (Threshold != NoThreshold) { |
Owen Anderson | f9a26b8 | 2010-09-09 20:32:23 +0000 | [diff] [blame] | 206 | unsigned NumInlineCandidates; |
James Molloy | 67ae135 | 2012-12-20 16:04:27 +0000 | [diff] [blame] | 207 | bool notDuplicatable; |
| 208 | unsigned LoopSize = ApproximateLoopSize(L, NumInlineCandidates, |
Chandler Carruth | a5157e6 | 2013-01-21 13:04:33 +0000 | [diff] [blame] | 209 | notDuplicatable, TTI); |
David Greene | d241e38 | 2010-01-05 01:27:44 +0000 | [diff] [blame] | 210 | DEBUG(dbgs() << " Loop Size = " << LoopSize << "\n"); |
James Molloy | 67ae135 | 2012-12-20 16:04:27 +0000 | [diff] [blame] | 211 | if (notDuplicatable) { |
| 212 | DEBUG(dbgs() << " Not unrolling loop which contains non duplicatable" |
| 213 | << " instructions.\n"); |
| 214 | return false; |
| 215 | } |
Owen Anderson | f9a26b8 | 2010-09-09 20:32:23 +0000 | [diff] [blame] | 216 | if (NumInlineCandidates != 0) { |
| 217 | DEBUG(dbgs() << " Not unrolling loop with inlinable calls.\n"); |
Owen Anderson | 547462b | 2010-09-09 20:02:23 +0000 | [diff] [blame] | 218 | return false; |
Jakob Stoklund Olesen | d450e5b | 2010-02-05 23:21:31 +0000 | [diff] [blame] | 219 | } |
Owen Anderson | 69daca5 | 2010-09-29 18:05:19 +0000 | [diff] [blame] | 220 | uint64_t Size = (uint64_t)LoopSize*Count; |
Junjie Gu | 32644d9 | 2011-04-13 16:15:29 +0000 | [diff] [blame] | 221 | if (TripCount != 1 && Size > Threshold) { |
David Greene | d241e38 | 2010-01-05 01:27:44 +0000 | [diff] [blame] | 222 | DEBUG(dbgs() << " Too large to fully unroll with count: " << Count |
Junjie Gu | 32644d9 | 2011-04-13 16:15:29 +0000 | [diff] [blame] | 223 | << " because size: " << Size << ">" << Threshold << "\n"); |
Hal Finkel | 4f7e2c3 | 2013-09-11 19:25:43 +0000 | [diff] [blame^] | 224 | bool AllowPartial = UserAllowPartial ? CurrentAllowPartial : UP.Partial; |
| 225 | if (!AllowPartial && !(Runtime && TripCount == 0)) { |
David Greene | d241e38 | 2010-01-05 01:27:44 +0000 | [diff] [blame] | 226 | DEBUG(dbgs() << " will not try to unroll partially because " |
Andreas Bolka | 52e539c | 2009-08-13 02:45:03 +0000 | [diff] [blame] | 227 | << "-unroll-allow-partial not given\n"); |
Matthijs Kooijman | 75cf9cc | 2008-07-29 13:21:23 +0000 | [diff] [blame] | 228 | return false; |
| 229 | } |
Andrew Trick | 5d73448 | 2011-12-09 06:19:40 +0000 | [diff] [blame] | 230 | if (TripCount) { |
| 231 | // Reduce unroll count to be modulo of TripCount for partial unrolling |
Hongbin Zheng | 00b73a5 | 2012-04-04 11:44:08 +0000 | [diff] [blame] | 232 | Count = Threshold / LoopSize; |
Andrew Trick | 5d73448 | 2011-12-09 06:19:40 +0000 | [diff] [blame] | 233 | while (Count != 0 && TripCount%Count != 0) |
| 234 | Count--; |
| 235 | } |
Hal Finkel | 4f7e2c3 | 2013-09-11 19:25:43 +0000 | [diff] [blame^] | 236 | else if (Runtime) { |
Andrew Trick | 5d73448 | 2011-12-09 06:19:40 +0000 | [diff] [blame] | 237 | // Reduce unroll count to be a lower power-of-two value |
Hongbin Zheng | 00b73a5 | 2012-04-04 11:44:08 +0000 | [diff] [blame] | 238 | while (Count != 0 && Size > Threshold) { |
Andrew Trick | 5d73448 | 2011-12-09 06:19:40 +0000 | [diff] [blame] | 239 | Count >>= 1; |
| 240 | Size = LoopSize*Count; |
| 241 | } |
Andreas Bolka | ec40eb4 | 2009-08-13 03:00:57 +0000 | [diff] [blame] | 242 | } |
| 243 | if (Count < 2) { |
David Greene | d241e38 | 2010-01-05 01:27:44 +0000 | [diff] [blame] | 244 | DEBUG(dbgs() << " could not unroll partially\n"); |
Andreas Bolka | ec40eb4 | 2009-08-13 03:00:57 +0000 | [diff] [blame] | 245 | return false; |
| 246 | } |
David Greene | d241e38 | 2010-01-05 01:27:44 +0000 | [diff] [blame] | 247 | DEBUG(dbgs() << " partially unrolling with count: " << Count << "\n"); |
Dan Gohman | c767844 | 2007-05-11 20:53:41 +0000 | [diff] [blame] | 248 | } |
| 249 | } |
| 250 | |
Dan Gohman | 45b3197 | 2008-05-14 00:24:14 +0000 | [diff] [blame] | 251 | // Unroll the loop. |
Hal Finkel | 4f7e2c3 | 2013-09-11 19:25:43 +0000 | [diff] [blame^] | 252 | if (!UnrollLoop(L, Count, TripCount, Runtime, TripMultiple, LI, &LPM)) |
Dan Gohman | 45b3197 | 2008-05-14 00:24:14 +0000 | [diff] [blame] | 253 | return false; |
Dan Gohman | c767844 | 2007-05-11 20:53:41 +0000 | [diff] [blame] | 254 | |
Chris Lattner | 83bf288 | 2004-04-18 05:20:17 +0000 | [diff] [blame] | 255 | return true; |
| 256 | } |