Chris Lattner | f48f777 | 2004-04-19 18:07:02 +0000 | [diff] [blame] | 1 | //===-- LoopUnswitch.cpp - Hoist loop-invariant conditionals in loop ------===// |
Misha Brukman | b1c9317 | 2005-04-21 23:48:37 +0000 | [diff] [blame] | 2 | // |
Chris Lattner | f48f777 | 2004-04-19 18:07:02 +0000 | [diff] [blame] | 3 | // The LLVM Compiler Infrastructure |
| 4 | // |
Chris Lattner | f3ebc3f | 2007-12-29 20:36:04 +0000 | [diff] [blame] | 5 | // This file is distributed under the University of Illinois Open Source |
| 6 | // License. See LICENSE.TXT for details. |
Misha Brukman | b1c9317 | 2005-04-21 23:48:37 +0000 | [diff] [blame] | 7 | // |
Chris Lattner | f48f777 | 2004-04-19 18:07:02 +0000 | [diff] [blame] | 8 | //===----------------------------------------------------------------------===// |
| 9 | // |
| 10 | // This pass transforms loops that contain branches on loop-invariant conditions |
| 11 | // to have multiple loops. For example, it turns the left into the right code: |
| 12 | // |
//  for (...)                  if (lic)
//    A                          for (...)
//    if (lic)                     A; B; C
//      B                      else
//    C                          for (...)
//                                 A; C
| 19 | // |
| 20 | // This can increase the size of the code exponentially (doubling it every time |
| 21 | // a loop is unswitched) so we only unswitch if the resultant code will be |
| 22 | // smaller than a threshold. |
| 23 | // |
| 24 | // This pass expects LICM to be run before it to hoist invariant conditions out |
| 25 | // of the loop, to make the unswitching opportunity obvious. |
| 26 | // |
| 27 | //===----------------------------------------------------------------------===// |
| 28 | |
Chris Lattner | f48f777 | 2004-04-19 18:07:02 +0000 | [diff] [blame] | 29 | #include "llvm/Transforms/Scalar.h" |
Chandler Carruth | ed0881b | 2012-12-03 16:50:05 +0000 | [diff] [blame] | 30 | #include "llvm/ADT/STLExtras.h" |
| 31 | #include "llvm/ADT/SmallPtrSet.h" |
| 32 | #include "llvm/ADT/Statistic.h" |
James Molloy | efbba72 | 2015-09-10 10:22:12 +0000 | [diff] [blame] | 33 | #include "llvm/Analysis/GlobalsModRef.h" |
Chandler Carruth | 66b3130 | 2015-01-04 12:03:27 +0000 | [diff] [blame] | 34 | #include "llvm/Analysis/AssumptionCache.h" |
Chandler Carruth | ed0881b | 2012-12-03 16:50:05 +0000 | [diff] [blame] | 35 | #include "llvm/Analysis/CodeMetrics.h" |
Chandler Carruth | ed0881b | 2012-12-03 16:50:05 +0000 | [diff] [blame] | 36 | #include "llvm/Analysis/InstructionSimplify.h" |
| 37 | #include "llvm/Analysis/LoopInfo.h" |
| 38 | #include "llvm/Analysis/LoopPass.h" |
| 39 | #include "llvm/Analysis/ScalarEvolution.h" |
Chandler Carruth | bb9caa9 | 2013-01-21 13:04:33 +0000 | [diff] [blame] | 40 | #include "llvm/Analysis/TargetTransformInfo.h" |
Chen Li | 9f27fc0 | 2015-09-29 05:03:32 +0000 | [diff] [blame] | 41 | #include "llvm/Analysis/BlockFrequencyInfoImpl.h" |
| 42 | #include "llvm/Analysis/BlockFrequencyInfo.h" |
| 43 | #include "llvm/Analysis/BranchProbabilityInfo.h" |
| 44 | #include "llvm/Support/BranchProbability.h" |
Chandler Carruth | 9fb823b | 2013-01-02 11:36:10 +0000 | [diff] [blame] | 45 | #include "llvm/IR/Constants.h" |
| 46 | #include "llvm/IR/DerivedTypes.h" |
Chandler Carruth | 5ad5f15 | 2014-01-13 09:26:24 +0000 | [diff] [blame] | 47 | #include "llvm/IR/Dominators.h" |
Chandler Carruth | 9fb823b | 2013-01-02 11:36:10 +0000 | [diff] [blame] | 48 | #include "llvm/IR/Function.h" |
| 49 | #include "llvm/IR/Instructions.h" |
Mehdi Amini | a28d91d | 2015-03-10 02:37:25 +0000 | [diff] [blame] | 50 | #include "llvm/IR/Module.h" |
Weiming Zhao | f1abad5 | 2015-06-23 05:31:09 +0000 | [diff] [blame] | 51 | #include "llvm/IR/MDBuilder.h" |
Chris Lattner | 8976219 | 2006-02-09 20:15:48 +0000 | [diff] [blame] | 52 | #include "llvm/Support/CommandLine.h" |
Reid Spencer | 557ab15 | 2007-02-05 23:32:05 +0000 | [diff] [blame] | 53 | #include "llvm/Support/Debug.h" |
Daniel Dunbar | 0dd5e1e | 2009-07-25 00:23:56 +0000 | [diff] [blame] | 54 | #include "llvm/Support/raw_ostream.h" |
Chandler Carruth | ed0881b | 2012-12-03 16:50:05 +0000 | [diff] [blame] | 55 | #include "llvm/Transforms/Utils/BasicBlockUtils.h" |
| 56 | #include "llvm/Transforms/Utils/Cloning.h" |
| 57 | #include "llvm/Transforms/Utils/Local.h" |
Alkis Evlogimenos | a5c04ee | 2004-09-03 18:19:51 +0000 | [diff] [blame] | 58 | #include <algorithm> |
Stepan Dyatkovskiy | cb2adbac | 2012-01-15 09:44:07 +0000 | [diff] [blame] | 59 | #include <map> |
Chris Lattner | 2826e05 | 2006-02-09 19:14:52 +0000 | [diff] [blame] | 60 | #include <set> |
Chris Lattner | f48f777 | 2004-04-19 18:07:02 +0000 | [diff] [blame] | 61 | using namespace llvm; |
| 62 | |
Chandler Carruth | 964daaa | 2014-04-22 02:55:47 +0000 | [diff] [blame] | 63 | #define DEBUG_TYPE "loop-unswitch" |
| 64 | |
Chris Lattner | 79a42ac | 2006-12-19 21:40:18 +0000 | [diff] [blame] | 65 | STATISTIC(NumBranches, "Number of branches unswitched"); |
| 66 | STATISTIC(NumSwitches, "Number of switches unswitched"); |
| 67 | STATISTIC(NumSelects , "Number of selects unswitched"); |
| 68 | STATISTIC(NumTrivial , "Number of unswitches that are trivial"); |
| 69 | STATISTIC(NumSimplify, "Number of simplifications of unswitched code"); |
Stepan Dyatkovskiy | 8216569 | 2012-01-11 08:40:51 +0000 | [diff] [blame] | 70 | STATISTIC(TotalInsts, "Total number of instructions analyzed"); |
Chris Lattner | 79a42ac | 2006-12-19 21:40:18 +0000 | [diff] [blame] | 71 | |
Stepan Dyatkovskiy | 2931a59 | 2012-01-16 20:48:04 +0000 | [diff] [blame] | 72 | // The specific value of 100 here was chosen based only on intuition and a |
Dan Gohman | 71ca652 | 2009-10-13 17:50:43 +0000 | [diff] [blame] | 73 | // few specific examples. |
Dan Gohman | d78c400 | 2008-05-13 00:00:25 +0000 | [diff] [blame] | 74 | static cl::opt<unsigned> |
| 75 | Threshold("loop-unswitch-threshold", cl::desc("Max loop size to unswitch"), |
Stepan Dyatkovskiy | 8216569 | 2012-01-11 08:40:51 +0000 | [diff] [blame] | 76 | cl::init(100), cl::Hidden); |
Andrew Trick | 4104ed9 | 2012-04-10 05:14:37 +0000 | [diff] [blame] | 77 | |
Chen Li | 9f27fc0 | 2015-09-29 05:03:32 +0000 | [diff] [blame] | 78 | static cl::opt<bool> |
| 79 | LoopUnswitchWithBlockFrequency("loop-unswitch-with-block-frequency", |
| 80 | cl::init(false), cl::Hidden, |
| 81 | cl::desc("Enable the use of the block frequency analysis to access PGO " |
| 82 | "heuristics to minimize code growth in cold regions.")); |
| 83 | |
| 84 | static cl::opt<unsigned> |
| 85 | ColdnessThreshold("loop-unswitch-coldness-threshold", cl::init(1), cl::Hidden, |
| 86 | cl::desc("Coldness threshold in percentage. The loop header frequency " |
| 87 | "(relative to the entry frequency) is compared with this " |
| 88 | "threshold to determine if non-trivial unswitching should be " |
| 89 | "enabled.")); |
| 90 | |
Dan Gohman | d78c400 | 2008-05-13 00:00:25 +0000 | [diff] [blame] | 91 | namespace { |
Andrew Trick | 4104ed9 | 2012-04-10 05:14:37 +0000 | [diff] [blame] | 92 | |
Stepan Dyatkovskiy | cb2adbac | 2012-01-15 09:44:07 +0000 | [diff] [blame] | 93 | class LUAnalysisCache { |
| 94 | |
| 95 | typedef DenseMap<const SwitchInst*, SmallPtrSet<const Value *, 8> > |
| 96 | UnswitchedValsMap; |
Andrew Trick | 4104ed9 | 2012-04-10 05:14:37 +0000 | [diff] [blame] | 97 | |
Stepan Dyatkovskiy | cb2adbac | 2012-01-15 09:44:07 +0000 | [diff] [blame] | 98 | typedef UnswitchedValsMap::iterator UnswitchedValsIt; |
Andrew Trick | 4104ed9 | 2012-04-10 05:14:37 +0000 | [diff] [blame] | 99 | |
Stepan Dyatkovskiy | cb2adbac | 2012-01-15 09:44:07 +0000 | [diff] [blame] | 100 | struct LoopProperties { |
| 101 | unsigned CanBeUnswitchedCount; |
Mark Heffernan | 9b536a6 | 2015-06-23 18:26:50 +0000 | [diff] [blame] | 102 | unsigned WasUnswitchedCount; |
Stepan Dyatkovskiy | cb2adbac | 2012-01-15 09:44:07 +0000 | [diff] [blame] | 103 | unsigned SizeEstimation; |
| 104 | UnswitchedValsMap UnswitchedVals; |
| 105 | }; |
Andrew Trick | 4104ed9 | 2012-04-10 05:14:37 +0000 | [diff] [blame] | 106 | |
| 107 | // Here we use std::map instead of DenseMap, since we need to keep valid |
Stepan Dyatkovskiy | cb2adbac | 2012-01-15 09:44:07 +0000 | [diff] [blame] | 108 | // LoopProperties pointer for current loop for better performance. |
| 109 | typedef std::map<const Loop*, LoopProperties> LoopPropsMap; |
| 110 | typedef LoopPropsMap::iterator LoopPropsMapIt; |
Andrew Trick | 4104ed9 | 2012-04-10 05:14:37 +0000 | [diff] [blame] | 111 | |
Stepan Dyatkovskiy | cb2adbac | 2012-01-15 09:44:07 +0000 | [diff] [blame] | 112 | LoopPropsMap LoopsProperties; |
Jakub Staszak | 27da123 | 2013-08-06 17:03:42 +0000 | [diff] [blame] | 113 | UnswitchedValsMap *CurLoopInstructions; |
| 114 | LoopProperties *CurrentLoopProperties; |
Andrew Trick | 4104ed9 | 2012-04-10 05:14:37 +0000 | [diff] [blame] | 115 | |
Mark Heffernan | 9b536a6 | 2015-06-23 18:26:50 +0000 | [diff] [blame] | 116 | // A loop unswitching with an estimated cost above this threshold |
| 117 | // is not performed. MaxSize is turned into unswitching quota for |
| 118 | // the current loop, and reduced correspondingly, though note that |
| 119 | // the quota is returned by releaseMemory() when the loop has been |
| 120 | // processed, so that MaxSize will return to its previous |
| 121 | // value. So in most cases MaxSize will equal the Threshold flag |
| 122 | // when a new loop is processed. An exception to that is that |
| 123 | // MaxSize will have a smaller value while processing nested loops |
| 124 | // that were introduced due to loop unswitching of an outer loop. |
| 125 | // |
| 126 | // FIXME: The way that MaxSize works is subtle and depends on the |
| 127 | // pass manager processing loops and calling releaseMemory() in a |
| 128 | // specific order. It would be good to find a more straightforward |
| 129 | // way of doing what MaxSize does. |
Stepan Dyatkovskiy | cb2adbac | 2012-01-15 09:44:07 +0000 | [diff] [blame] | 130 | unsigned MaxSize; |
Andrew Trick | 4104ed9 | 2012-04-10 05:14:37 +0000 | [diff] [blame] | 131 | |
Mark Heffernan | 9b536a6 | 2015-06-23 18:26:50 +0000 | [diff] [blame] | 132 | public: |
| 133 | LUAnalysisCache() |
| 134 | : CurLoopInstructions(nullptr), CurrentLoopProperties(nullptr), |
| 135 | MaxSize(Threshold) {} |
Andrew Trick | 4104ed9 | 2012-04-10 05:14:37 +0000 | [diff] [blame] | 136 | |
Mark Heffernan | 9b536a6 | 2015-06-23 18:26:50 +0000 | [diff] [blame] | 137 | // Analyze loop. Check its size, calculate is it possible to unswitch |
| 138 | // it. Returns true if we can unswitch this loop. |
| 139 | bool countLoop(const Loop *L, const TargetTransformInfo &TTI, |
| 140 | AssumptionCache *AC); |
Andrew Trick | 4104ed9 | 2012-04-10 05:14:37 +0000 | [diff] [blame] | 141 | |
Mark Heffernan | 9b536a6 | 2015-06-23 18:26:50 +0000 | [diff] [blame] | 142 | // Clean all data related to given loop. |
| 143 | void forgetLoop(const Loop *L); |
Andrew Trick | 4104ed9 | 2012-04-10 05:14:37 +0000 | [diff] [blame] | 144 | |
Mark Heffernan | 9b536a6 | 2015-06-23 18:26:50 +0000 | [diff] [blame] | 145 | // Mark case value as unswitched. |
| 146 | // Since SI instruction can be partly unswitched, in order to avoid |
| 147 | // extra unswitching in cloned loops keep track all unswitched values. |
| 148 | void setUnswitched(const SwitchInst *SI, const Value *V); |
Andrew Trick | 4104ed9 | 2012-04-10 05:14:37 +0000 | [diff] [blame] | 149 | |
Mark Heffernan | 9b536a6 | 2015-06-23 18:26:50 +0000 | [diff] [blame] | 150 | // Check was this case value unswitched before or not. |
| 151 | bool isUnswitched(const SwitchInst *SI, const Value *V); |
Andrew Trick | 4104ed9 | 2012-04-10 05:14:37 +0000 | [diff] [blame] | 152 | |
Mark Heffernan | 9b536a6 | 2015-06-23 18:26:50 +0000 | [diff] [blame] | 153 | // Returns true if another unswitching could be done within the cost |
| 154 | // threshold. |
| 155 | bool CostAllowsUnswitching(); |
Andrew Trick | 4104ed9 | 2012-04-10 05:14:37 +0000 | [diff] [blame] | 156 | |
Mark Heffernan | 9b536a6 | 2015-06-23 18:26:50 +0000 | [diff] [blame] | 157 | // Clone all loop-unswitch related loop properties. |
| 158 | // Redistribute unswitching quotas. |
| 159 | // Note, that new loop data is stored inside the VMap. |
| 160 | void cloneData(const Loop *NewLoop, const Loop *OldLoop, |
| 161 | const ValueToValueMapTy &VMap); |
Stepan Dyatkovskiy | cb2adbac | 2012-01-15 09:44:07 +0000 | [diff] [blame] | 162 | }; |
Andrew Trick | 4104ed9 | 2012-04-10 05:14:37 +0000 | [diff] [blame] | 163 | |
Chris Lattner | 2dd09db | 2009-09-02 06:11:42 +0000 | [diff] [blame] | 164 | class LoopUnswitch : public LoopPass { |
Chris Lattner | f48f777 | 2004-04-19 18:07:02 +0000 | [diff] [blame] | 165 | LoopInfo *LI; // Loop information |
Devang Patel | 901a27d | 2007-03-07 00:26:10 +0000 | [diff] [blame] | 166 | LPPassManager *LPM; |
Chandler Carruth | 66b3130 | 2015-01-04 12:03:27 +0000 | [diff] [blame] | 167 | AssumptionCache *AC; |
Chris Lattner | c2e3a7a | 2006-02-18 07:57:38 +0000 | [diff] [blame] | 168 | |
Sanjay Patel | 956e29c | 2015-08-11 21:24:04 +0000 | [diff] [blame] | 169 | // Used to check if second loop needs processing after |
| 170 | // RewriteLoopBodyWithConditionConstant rewrites first loop. |
Chris Lattner | c2e3a7a | 2006-02-18 07:57:38 +0000 | [diff] [blame] | 171 | std::vector<Loop*> LoopProcessWorklist; |
Stepan Dyatkovskiy | cb2adbac | 2012-01-15 09:44:07 +0000 | [diff] [blame] | 172 | |
Stepan Dyatkovskiy | cb2adbac | 2012-01-15 09:44:07 +0000 | [diff] [blame] | 173 | LUAnalysisCache BranchesInfo; |
Andrew Trick | 4104ed9 | 2012-04-10 05:14:37 +0000 | [diff] [blame] | 174 | |
Chen Li | 9f27fc0 | 2015-09-29 05:03:32 +0000 | [diff] [blame] | 175 | bool EnabledPGO; |
| 176 | |
| 177 | // BFI and ColdEntryFreq are only used when PGO and |
| 178 | // LoopUnswitchWithBlockFrequency are enabled. |
| 179 | BlockFrequencyInfo BFI; |
| 180 | BlockFrequency ColdEntryFreq; |
| 181 | |
Devang Patel | 506310d | 2007-06-06 00:21:03 +0000 | [diff] [blame] | 182 | bool OptimizeForSize; |
Devang Patel | 7d165e1 | 2007-07-30 23:07:10 +0000 | [diff] [blame] | 183 | bool redoLoop; |
Devang Patel | a69f987 | 2007-10-05 22:29:34 +0000 | [diff] [blame] | 184 | |
Devang Patel | e149d4e | 2008-07-02 01:18:13 +0000 | [diff] [blame] | 185 | Loop *currentLoop; |
Devang Patel | a69f987 | 2007-10-05 22:29:34 +0000 | [diff] [blame] | 186 | DominatorTree *DT; |
Devang Patel | e149d4e | 2008-07-02 01:18:13 +0000 | [diff] [blame] | 187 | BasicBlock *loopHeader; |
| 188 | BasicBlock *loopPreheader; |
Andrew Trick | 4104ed9 | 2012-04-10 05:14:37 +0000 | [diff] [blame] | 189 | |
Devang Patel | ed50fb5 | 2008-07-02 01:44:29 +0000 | [diff] [blame] | 190 | // LoopBlocks contains all of the basic blocks of the loop, including the |
Andrew Trick | 4104ed9 | 2012-04-10 05:14:37 +0000 | [diff] [blame] | 191 | // preheader of the loop, the body of the loop, and the exit blocks of the |
Devang Patel | ed50fb5 | 2008-07-02 01:44:29 +0000 | [diff] [blame] | 192 | // loop, in that order. |
| 193 | std::vector<BasicBlock*> LoopBlocks; |
| 194 | // NewBlocks contained cloned copy of basic blocks from LoopBlocks. |
| 195 | std::vector<BasicBlock*> NewBlocks; |
Devang Patel | eb611dd | 2008-07-03 17:37:52 +0000 | [diff] [blame] | 196 | |
Chris Lattner | f48f777 | 2004-04-19 18:07:02 +0000 | [diff] [blame] | 197 | public: |
Devang Patel | 8c78a0b | 2007-05-03 01:11:54 +0000 | [diff] [blame] | 198 | static char ID; // Pass ID, replacement for typeid |
Andrew Trick | 4104ed9 | 2012-04-10 05:14:37 +0000 | [diff] [blame] | 199 | explicit LoopUnswitch(bool Os = false) : |
| 200 | LoopPass(ID), OptimizeForSize(Os), redoLoop(false), |
Craig Topper | f40110f | 2014-04-25 05:29:35 +0000 | [diff] [blame] | 201 | currentLoop(nullptr), DT(nullptr), loopHeader(nullptr), |
| 202 | loopPreheader(nullptr) { |
Owen Anderson | 6c18d1a | 2010-10-19 17:21:58 +0000 | [diff] [blame] | 203 | initializeLoopUnswitchPass(*PassRegistry::getPassRegistry()); |
| 204 | } |
Devang Patel | 09f162c | 2007-05-01 21:15:47 +0000 | [diff] [blame] | 205 | |
Craig Topper | 3e4c697 | 2014-03-05 09:10:37 +0000 | [diff] [blame] | 206 | bool runOnLoop(Loop *L, LPPassManager &LPM) override; |
Devang Patel | e149d4e | 2008-07-02 01:18:13 +0000 | [diff] [blame] | 207 | bool processCurrentLoop(); |
Chris Lattner | f48f777 | 2004-04-19 18:07:02 +0000 | [diff] [blame] | 208 | |
| 209 | /// This transformation requires natural loop information & requires that |
Chris Lattner | bc1a65a | 2010-08-29 17:23:19 +0000 | [diff] [blame] | 210 | /// loop preheaders be inserted into the CFG. |
Chris Lattner | f48f777 | 2004-04-19 18:07:02 +0000 | [diff] [blame] | 211 | /// |
Craig Topper | 3e4c697 | 2014-03-05 09:10:37 +0000 | [diff] [blame] | 212 | void getAnalysisUsage(AnalysisUsage &AU) const override { |
Chandler Carruth | 66b3130 | 2015-01-04 12:03:27 +0000 | [diff] [blame] | 213 | AU.addRequired<AssumptionCacheTracker>(); |
Chris Lattner | f48f777 | 2004-04-19 18:07:02 +0000 | [diff] [blame] | 214 | AU.addRequiredID(LoopSimplifyID); |
Chris Lattner | 4f0e66d | 2006-02-09 22:15:42 +0000 | [diff] [blame] | 215 | AU.addPreservedID(LoopSimplifyID); |
Chandler Carruth | 4f8f307 | 2015-01-17 14:16:18 +0000 | [diff] [blame] | 216 | AU.addRequired<LoopInfoWrapperPass>(); |
| 217 | AU.addPreserved<LoopInfoWrapperPass>(); |
Owen Anderson | fd0a3d6 | 2006-06-12 21:49:21 +0000 | [diff] [blame] | 218 | AU.addRequiredID(LCSSAID); |
Devang Patel | d491198 | 2007-07-31 08:03:26 +0000 | [diff] [blame] | 219 | AU.addPreservedID(LCSSAID); |
Michael Zolotukhin | 9f3aea6 | 2015-09-22 00:22:47 +0000 | [diff] [blame] | 220 | AU.addRequired<DominatorTreeWrapperPass>(); |
Chandler Carruth | 7352302 | 2014-01-13 13:07:17 +0000 | [diff] [blame] | 221 | AU.addPreserved<DominatorTreeWrapperPass>(); |
Chandler Carruth | 2f1fd16 | 2015-08-17 02:08:17 +0000 | [diff] [blame] | 222 | AU.addPreserved<ScalarEvolutionWrapperPass>(); |
Chandler Carruth | 705b185 | 2015-01-31 03:43:40 +0000 | [diff] [blame] | 223 | AU.addRequired<TargetTransformInfoWrapperPass>(); |
James Molloy | efbba72 | 2015-09-10 10:22:12 +0000 | [diff] [blame] | 224 | AU.addPreserved<GlobalsAAWrapperPass>(); |
Chris Lattner | f48f777 | 2004-04-19 18:07:02 +0000 | [diff] [blame] | 225 | } |
| 226 | |
| 227 | private: |
Devang Patel | d491198 | 2007-07-31 08:03:26 +0000 | [diff] [blame] | 228 | |
Craig Topper | 3e4c697 | 2014-03-05 09:10:37 +0000 | [diff] [blame] | 229 | void releaseMemory() override { |
Stepan Dyatkovskiy | cb2adbac | 2012-01-15 09:44:07 +0000 | [diff] [blame] | 230 | BranchesInfo.forgetLoop(currentLoop); |
Dan Gohman | 3ddbc24 | 2009-09-08 15:45:00 +0000 | [diff] [blame] | 231 | } |
| 232 | |
Devang Patel | e149d4e | 2008-07-02 01:18:13 +0000 | [diff] [blame] | 233 | void initLoopData() { |
| 234 | loopHeader = currentLoop->getHeader(); |
| 235 | loopPreheader = currentLoop->getLoopPreheader(); |
| 236 | } |
Andrew Trick | 4104ed9 | 2012-04-10 05:14:37 +0000 | [diff] [blame] | 237 | |
Chris Lattner | 559c867 | 2008-04-21 00:25:49 +0000 | [diff] [blame] | 238 | /// Split all of the edges from inside the loop to their exit blocks. |
| 239 | /// Update the appropriate Phi nodes as we do so. |
Sanjay Patel | 41f3d95 | 2015-08-11 21:11:56 +0000 | [diff] [blame] | 240 | void SplitExitEdges(Loop *L, |
| 241 | const SmallVectorImpl<BasicBlock *> &ExitBlocks); |
Devang Patel | a69f987 | 2007-10-05 22:29:34 +0000 | [diff] [blame] | 242 | |
Chen Li | c0f3a15 | 2015-07-22 05:26:29 +0000 | [diff] [blame] | 243 | bool TryTrivialLoopUnswitch(bool &Changed); |
| 244 | |
Weiming Zhao | f1abad5 | 2015-06-23 05:31:09 +0000 | [diff] [blame] | 245 | bool UnswitchIfProfitable(Value *LoopCond, Constant *Val, |
| 246 | TerminatorInst *TI = nullptr); |
Chris Lattner | 29f771b | 2006-02-18 01:27:45 +0000 | [diff] [blame] | 247 | void UnswitchTrivialCondition(Loop *L, Value *Cond, Constant *Val, |
Weiming Zhao | f1abad5 | 2015-06-23 05:31:09 +0000 | [diff] [blame] | 248 | BasicBlock *ExitBlock, TerminatorInst *TI); |
| 249 | void UnswitchNontrivialCondition(Value *LIC, Constant *OnVal, Loop *L, |
| 250 | TerminatorInst *TI); |
Chris Lattner | c2e3a7a | 2006-02-18 07:57:38 +0000 | [diff] [blame] | 251 | |
| 252 | void RewriteLoopBodyWithConditionConstant(Loop *L, Value *LIC, |
| 253 | Constant *Val, bool isEqual); |
Devang Patel | 3304e46 | 2007-06-28 00:49:00 +0000 | [diff] [blame] | 254 | |
| 255 | void EmitPreheaderBranchOnCondition(Value *LIC, Constant *Val, |
Andrew Trick | 4104ed9 | 2012-04-10 05:14:37 +0000 | [diff] [blame] | 256 | BasicBlock *TrueDest, |
Devang Patel | 3304e46 | 2007-06-28 00:49:00 +0000 | [diff] [blame] | 257 | BasicBlock *FalseDest, |
Weiming Zhao | f1abad5 | 2015-06-23 05:31:09 +0000 | [diff] [blame] | 258 | Instruction *InsertPt, |
| 259 | TerminatorInst *TI); |
Devang Patel | 3304e46 | 2007-06-28 00:49:00 +0000 | [diff] [blame] | 260 | |
Devang Patel | d491198 | 2007-07-31 08:03:26 +0000 | [diff] [blame] | 261 | void SimplifyCode(std::vector<Instruction*> &Worklist, Loop *L); |
Chris Lattner | f48f777 | 2004-04-19 18:07:02 +0000 | [diff] [blame] | 262 | }; |
Alexander Kornienko | f00654e | 2015-06-23 09:49:53 +0000 | [diff] [blame] | 263 | } |
Stepan Dyatkovskiy | cb2adbac | 2012-01-15 09:44:07 +0000 | [diff] [blame] | 264 | |
| 265 | // Analyze loop. Check its size, calculate is it possible to unswitch |
| 266 | // it. Returns true if we can unswitch this loop. |
Hal Finkel | 57f03dd | 2014-09-07 13:49:57 +0000 | [diff] [blame] | 267 | bool LUAnalysisCache::countLoop(const Loop *L, const TargetTransformInfo &TTI, |
Chandler Carruth | 66b3130 | 2015-01-04 12:03:27 +0000 | [diff] [blame] | 268 | AssumptionCache *AC) { |
Andrew Trick | 4104ed9 | 2012-04-10 05:14:37 +0000 | [diff] [blame] | 269 | |
Jakub Staszak | 27da123 | 2013-08-06 17:03:42 +0000 | [diff] [blame] | 270 | LoopPropsMapIt PropsIt; |
| 271 | bool Inserted; |
Benjamin Kramer | d6f1f84 | 2014-03-02 13:30:33 +0000 | [diff] [blame] | 272 | std::tie(PropsIt, Inserted) = |
Stepan Dyatkovskiy | cb2adbac | 2012-01-15 09:44:07 +0000 | [diff] [blame] | 273 | LoopsProperties.insert(std::make_pair(L, LoopProperties())); |
Andrew Trick | 4104ed9 | 2012-04-10 05:14:37 +0000 | [diff] [blame] | 274 | |
Jakub Staszak | 27da123 | 2013-08-06 17:03:42 +0000 | [diff] [blame] | 275 | LoopProperties &Props = PropsIt->second; |
Andrew Trick | 4104ed9 | 2012-04-10 05:14:37 +0000 | [diff] [blame] | 276 | |
Jakub Staszak | 27da123 | 2013-08-06 17:03:42 +0000 | [diff] [blame] | 277 | if (Inserted) { |
Stepan Dyatkovskiy | cb2adbac | 2012-01-15 09:44:07 +0000 | [diff] [blame] | 278 | // New loop. |
| 279 | |
| 280 | // Limit the number of instructions to avoid causing significant code |
| 281 | // expansion, and the number of basic blocks, to avoid loops with |
| 282 | // large numbers of branches which cause loop unswitching to go crazy. |
| 283 | // This is a very ad-hoc heuristic. |
Andrew Trick | 4104ed9 | 2012-04-10 05:14:37 +0000 | [diff] [blame] | 284 | |
Hal Finkel | 57f03dd | 2014-09-07 13:49:57 +0000 | [diff] [blame] | 285 | SmallPtrSet<const Value *, 32> EphValues; |
Chandler Carruth | 66b3130 | 2015-01-04 12:03:27 +0000 | [diff] [blame] | 286 | CodeMetrics::collectEphemeralValues(L, AC, EphValues); |
Hal Finkel | 57f03dd | 2014-09-07 13:49:57 +0000 | [diff] [blame] | 287 | |
Stepan Dyatkovskiy | cb2adbac | 2012-01-15 09:44:07 +0000 | [diff] [blame] | 288 | // FIXME: This is overly conservative because it does not take into |
| 289 | // consideration code simplification opportunities and code that can |
| 290 | // be shared by the resultant unswitched loops. |
| 291 | CodeMetrics Metrics; |
Mark Heffernan | 9b536a6 | 2015-06-23 18:26:50 +0000 | [diff] [blame] | 292 | for (Loop::block_iterator I = L->block_begin(), E = L->block_end(); I != E; |
| 293 | ++I) |
Hal Finkel | 57f03dd | 2014-09-07 13:49:57 +0000 | [diff] [blame] | 294 | Metrics.analyzeBasicBlock(*I, TTI, EphValues); |
Stepan Dyatkovskiy | cb2adbac | 2012-01-15 09:44:07 +0000 | [diff] [blame] | 295 | |
Mark Heffernan | 9b536a6 | 2015-06-23 18:26:50 +0000 | [diff] [blame] | 296 | Props.SizeEstimation = Metrics.NumInsts; |
Stepan Dyatkovskiy | cb2adbac | 2012-01-15 09:44:07 +0000 | [diff] [blame] | 297 | Props.CanBeUnswitchedCount = MaxSize / (Props.SizeEstimation); |
Mark Heffernan | 9b536a6 | 2015-06-23 18:26:50 +0000 | [diff] [blame] | 298 | Props.WasUnswitchedCount = 0; |
Stepan Dyatkovskiy | cb2adbac | 2012-01-15 09:44:07 +0000 | [diff] [blame] | 299 | MaxSize -= Props.SizeEstimation * Props.CanBeUnswitchedCount; |
James Molloy | 4f6fb95 | 2012-12-20 16:04:27 +0000 | [diff] [blame] | 300 | |
| 301 | if (Metrics.notDuplicatable) { |
| 302 | DEBUG(dbgs() << "NOT unswitching loop %" |
Jakub Staszak | 27da123 | 2013-08-06 17:03:42 +0000 | [diff] [blame] | 303 | << L->getHeader()->getName() << ", contents cannot be " |
| 304 | << "duplicated!\n"); |
James Molloy | 4f6fb95 | 2012-12-20 16:04:27 +0000 | [diff] [blame] | 305 | return false; |
| 306 | } |
Andrew Trick | 4104ed9 | 2012-04-10 05:14:37 +0000 | [diff] [blame] | 307 | } |
| 308 | |
Stepan Dyatkovskiy | cb2adbac | 2012-01-15 09:44:07 +0000 | [diff] [blame] | 309 | // Be careful. This links are good only before new loop addition. |
| 310 | CurrentLoopProperties = &Props; |
| 311 | CurLoopInstructions = &Props.UnswitchedVals; |
Andrew Trick | 4104ed9 | 2012-04-10 05:14:37 +0000 | [diff] [blame] | 312 | |
Stepan Dyatkovskiy | cb2adbac | 2012-01-15 09:44:07 +0000 | [diff] [blame] | 313 | return true; |
| 314 | } |
| 315 | |
| 316 | // Clean all data related to given loop. |
Jakub Staszak | 27da123 | 2013-08-06 17:03:42 +0000 | [diff] [blame] | 317 | void LUAnalysisCache::forgetLoop(const Loop *L) { |
Andrew Trick | 4104ed9 | 2012-04-10 05:14:37 +0000 | [diff] [blame] | 318 | |
Stepan Dyatkovskiy | cb2adbac | 2012-01-15 09:44:07 +0000 | [diff] [blame] | 319 | LoopPropsMapIt LIt = LoopsProperties.find(L); |
| 320 | |
| 321 | if (LIt != LoopsProperties.end()) { |
Jakub Staszak | 27da123 | 2013-08-06 17:03:42 +0000 | [diff] [blame] | 322 | LoopProperties &Props = LIt->second; |
Mark Heffernan | 9b536a6 | 2015-06-23 18:26:50 +0000 | [diff] [blame] | 323 | MaxSize += (Props.CanBeUnswitchedCount + Props.WasUnswitchedCount) * |
| 324 | Props.SizeEstimation; |
Stepan Dyatkovskiy | cb2adbac | 2012-01-15 09:44:07 +0000 | [diff] [blame] | 325 | LoopsProperties.erase(LIt); |
| 326 | } |
Andrew Trick | 4104ed9 | 2012-04-10 05:14:37 +0000 | [diff] [blame] | 327 | |
Craig Topper | f40110f | 2014-04-25 05:29:35 +0000 | [diff] [blame] | 328 | CurrentLoopProperties = nullptr; |
| 329 | CurLoopInstructions = nullptr; |
Stepan Dyatkovskiy | cb2adbac | 2012-01-15 09:44:07 +0000 | [diff] [blame] | 330 | } |
| 331 | |
| 332 | // Mark case value as unswitched. |
| 333 | // Since SI instruction can be partly unswitched, in order to avoid |
| 334 | // extra unswitching in cloned loops keep track all unswitched values. |
Jakub Staszak | 27da123 | 2013-08-06 17:03:42 +0000 | [diff] [blame] | 335 | void LUAnalysisCache::setUnswitched(const SwitchInst *SI, const Value *V) { |
Stepan Dyatkovskiy | cb2adbac | 2012-01-15 09:44:07 +0000 | [diff] [blame] | 336 | (*CurLoopInstructions)[SI].insert(V); |
| 337 | } |
| 338 | |
| 339 | // Check was this case value unswitched before or not. |
Jakub Staszak | 27da123 | 2013-08-06 17:03:42 +0000 | [diff] [blame] | 340 | bool LUAnalysisCache::isUnswitched(const SwitchInst *SI, const Value *V) { |
Andrew Trick | 4104ed9 | 2012-04-10 05:14:37 +0000 | [diff] [blame] | 341 | return (*CurLoopInstructions)[SI].count(V); |
Stepan Dyatkovskiy | cb2adbac | 2012-01-15 09:44:07 +0000 | [diff] [blame] | 342 | } |
| 343 | |
Mark Heffernan | 9b536a6 | 2015-06-23 18:26:50 +0000 | [diff] [blame] | 344 | bool LUAnalysisCache::CostAllowsUnswitching() { |
| 345 | return CurrentLoopProperties->CanBeUnswitchedCount > 0; |
| 346 | } |
| 347 | |
Stepan Dyatkovskiy | cb2adbac | 2012-01-15 09:44:07 +0000 | [diff] [blame] | 348 | // Clone all loop-unswitch related loop properties. |
| 349 | // Redistribute unswitching quotas. |
| 350 | // Note, that new loop data is stored inside the VMap. |
Jakub Staszak | 27da123 | 2013-08-06 17:03:42 +0000 | [diff] [blame] | 351 | void LUAnalysisCache::cloneData(const Loop *NewLoop, const Loop *OldLoop, |
| 352 | const ValueToValueMapTy &VMap) { |
Andrew Trick | 4104ed9 | 2012-04-10 05:14:37 +0000 | [diff] [blame] | 353 | |
Jakub Staszak | 27da123 | 2013-08-06 17:03:42 +0000 | [diff] [blame] | 354 | LoopProperties &NewLoopProps = LoopsProperties[NewLoop]; |
| 355 | LoopProperties &OldLoopProps = *CurrentLoopProperties; |
| 356 | UnswitchedValsMap &Insts = OldLoopProps.UnswitchedVals; |
Andrew Trick | 4104ed9 | 2012-04-10 05:14:37 +0000 | [diff] [blame] | 357 | |
Stepan Dyatkovskiy | cb2adbac | 2012-01-15 09:44:07 +0000 | [diff] [blame] | 358 | // Reallocate "can-be-unswitched quota" |
| 359 | |
| 360 | --OldLoopProps.CanBeUnswitchedCount; |
Mark Heffernan | 9b536a6 | 2015-06-23 18:26:50 +0000 | [diff] [blame] | 361 | ++OldLoopProps.WasUnswitchedCount; |
| 362 | NewLoopProps.WasUnswitchedCount = 0; |
Stepan Dyatkovskiy | cb2adbac | 2012-01-15 09:44:07 +0000 | [diff] [blame] | 363 | unsigned Quota = OldLoopProps.CanBeUnswitchedCount; |
| 364 | NewLoopProps.CanBeUnswitchedCount = Quota / 2; |
| 365 | OldLoopProps.CanBeUnswitchedCount = Quota - Quota / 2; |
Andrew Trick | 4104ed9 | 2012-04-10 05:14:37 +0000 | [diff] [blame] | 366 | |
Stepan Dyatkovskiy | cb2adbac | 2012-01-15 09:44:07 +0000 | [diff] [blame] | 367 | NewLoopProps.SizeEstimation = OldLoopProps.SizeEstimation; |
Andrew Trick | 4104ed9 | 2012-04-10 05:14:37 +0000 | [diff] [blame] | 368 | |
Stepan Dyatkovskiy | cb2adbac | 2012-01-15 09:44:07 +0000 | [diff] [blame] | 369 | // Clone unswitched values info: |
| 370 | // for new loop switches we clone info about values that was |
| 371 | // already unswitched and has redundant successors. |
| 372 | for (UnswitchedValsIt I = Insts.begin(); I != Insts.end(); ++I) { |
Jakub Staszak | 27da123 | 2013-08-06 17:03:42 +0000 | [diff] [blame] | 373 | const SwitchInst *OldInst = I->first; |
| 374 | Value *NewI = VMap.lookup(OldInst); |
| 375 | const SwitchInst *NewInst = cast_or_null<SwitchInst>(NewI); |
Stepan Dyatkovskiy | cb2adbac | 2012-01-15 09:44:07 +0000 | [diff] [blame] | 376 | assert(NewInst && "All instructions that are in SrcBB must be in VMap."); |
Andrew Trick | 4104ed9 | 2012-04-10 05:14:37 +0000 | [diff] [blame] | 377 | |
Stepan Dyatkovskiy | cb2adbac | 2012-01-15 09:44:07 +0000 | [diff] [blame] | 378 | NewLoopProps.UnswitchedVals[NewInst] = OldLoopProps.UnswitchedVals[OldInst]; |
| 379 | } |
| 380 | } |
| 381 | |
Dan Gohman | d78c400 | 2008-05-13 00:00:25 +0000 | [diff] [blame] | 382 | char LoopUnswitch::ID = 0; |
Owen Anderson | 8ac477f | 2010-10-12 19:48:12 +0000 | [diff] [blame] | 383 | INITIALIZE_PASS_BEGIN(LoopUnswitch, "loop-unswitch", "Unswitch loops", |
| 384 | false, false) |
Chandler Carruth | 705b185 | 2015-01-31 03:43:40 +0000 | [diff] [blame] | 385 | INITIALIZE_PASS_DEPENDENCY(TargetTransformInfoWrapperPass) |
Chandler Carruth | 66b3130 | 2015-01-04 12:03:27 +0000 | [diff] [blame] | 386 | INITIALIZE_PASS_DEPENDENCY(AssumptionCacheTracker) |
Owen Anderson | 8ac477f | 2010-10-12 19:48:12 +0000 | [diff] [blame] | 387 | INITIALIZE_PASS_DEPENDENCY(LoopSimplify) |
Chandler Carruth | 4f8f307 | 2015-01-17 14:16:18 +0000 | [diff] [blame] | 388 | INITIALIZE_PASS_DEPENDENCY(LoopInfoWrapperPass) |
Owen Anderson | 8ac477f | 2010-10-12 19:48:12 +0000 | [diff] [blame] | 389 | INITIALIZE_PASS_DEPENDENCY(LCSSA) |
Owen Anderson | 8ac477f | 2010-10-12 19:48:12 +0000 | [diff] [blame] | 390 | INITIALIZE_PASS_END(LoopUnswitch, "loop-unswitch", "Unswitch loops", |
| 391 | false, false) |
Chris Lattner | f48f777 | 2004-04-19 18:07:02 +0000 | [diff] [blame] | 392 | |
Andrew Trick | 4104ed9 | 2012-04-10 05:14:37 +0000 | [diff] [blame] | 393 | Pass *llvm::createLoopUnswitchPass(bool Os) { |
| 394 | return new LoopUnswitch(Os); |
Devang Patel | 506310d | 2007-06-06 00:21:03 +0000 | [diff] [blame] | 395 | } |
Chris Lattner | c2e3a7a | 2006-02-18 07:57:38 +0000 | [diff] [blame] | 396 | |
Sanjay Patel | 956e29c | 2015-08-11 21:24:04 +0000 | [diff] [blame] | 397 | /// Cond is a condition that occurs in L. If it is invariant in the loop, or has |
| 398 | /// an invariant piece, return the invariant. Otherwise, return null. |
Chris Lattner | c2e3a7a | 2006-02-18 07:57:38 +0000 | [diff] [blame] | 399 | static Value *FindLIVLoopCondition(Value *Cond, Loop *L, bool &Changed) { |
Andrew Trick | 4104ed9 | 2012-04-10 05:14:37 +0000 | [diff] [blame] | 400 | |
Stepan Dyatkovskiy | 8216569 | 2012-01-11 08:40:51 +0000 | [diff] [blame] | 401 | // We started analyze new instruction, increment scanned instructions counter. |
| 402 | ++TotalInsts; |
Andrew Trick | 4104ed9 | 2012-04-10 05:14:37 +0000 | [diff] [blame] | 403 | |
Chris Lattner | 302240d | 2010-02-02 02:26:54 +0000 | [diff] [blame] | 404 | // We can never unswitch on vector conditions. |
Duncan Sands | 19d0b47 | 2010-02-16 11:11:14 +0000 | [diff] [blame] | 405 | if (Cond->getType()->isVectorTy()) |
Craig Topper | f40110f | 2014-04-25 05:29:35 +0000 | [diff] [blame] | 406 | return nullptr; |
Chris Lattner | 302240d | 2010-02-02 02:26:54 +0000 | [diff] [blame] | 407 | |
Chris Lattner | c2e3a7a | 2006-02-18 07:57:38 +0000 | [diff] [blame] | 408 | // Constants should be folded, not unswitched on! |
Craig Topper | f40110f | 2014-04-25 05:29:35 +0000 | [diff] [blame] | 409 | if (isa<Constant>(Cond)) return nullptr; |
Devang Patel | 3c723c8 | 2007-06-28 00:44:10 +0000 | [diff] [blame] | 410 | |
Chris Lattner | c2e3a7a | 2006-02-18 07:57:38 +0000 | [diff] [blame] | 411 | // TODO: Handle: br (VARIANT|INVARIANT). |
Devang Patel | fe57d10 | 2008-11-03 19:38:07 +0000 | [diff] [blame] | 412 | |
Dan Gohman | 4d6149f | 2009-07-14 01:37:59 +0000 | [diff] [blame] | 413 | // Hoist simple values out. |
Dan Gohman | c43e479 | 2009-07-15 01:25:43 +0000 | [diff] [blame] | 414 | if (L->makeLoopInvariant(Cond, Changed)) |
Dan Gohman | 4d6149f | 2009-07-14 01:37:59 +0000 | [diff] [blame] | 415 | return Cond; |
Dan Gohman | 4d6149f | 2009-07-14 01:37:59 +0000 | [diff] [blame] | 416 | |
Chris Lattner | c2e3a7a | 2006-02-18 07:57:38 +0000 | [diff] [blame] | 417 | if (BinaryOperator *BO = dyn_cast<BinaryOperator>(Cond)) |
| 418 | if (BO->getOpcode() == Instruction::And || |
| 419 | BO->getOpcode() == Instruction::Or) { |
| 420 | // If either the left or right side is invariant, we can unswitch on this, |
| 421 | // which will cause the branch to go away in one loop and the condition to |
| 422 | // simplify in the other one. |
| 423 | if (Value *LHS = FindLIVLoopCondition(BO->getOperand(0), L, Changed)) |
| 424 | return LHS; |
| 425 | if (Value *RHS = FindLIVLoopCondition(BO->getOperand(1), L, Changed)) |
| 426 | return RHS; |
| 427 | } |
Andrew Trick | 4104ed9 | 2012-04-10 05:14:37 +0000 | [diff] [blame] | 428 | |
Craig Topper | f40110f | 2014-04-25 05:29:35 +0000 | [diff] [blame] | 429 | return nullptr; |
Chris Lattner | c2e3a7a | 2006-02-18 07:57:38 +0000 | [diff] [blame] | 430 | } |
| 431 | |
Devang Patel | 901a27d | 2007-03-07 00:26:10 +0000 | [diff] [blame] | 432 | bool LoopUnswitch::runOnLoop(Loop *L, LPPassManager &LPM_Ref) { |
Paul Robinson | af4e64d | 2014-02-06 00:07:05 +0000 | [diff] [blame] | 433 | if (skipOptnoneFunction(L)) |
| 434 | return false; |
| 435 | |
Chandler Carruth | 66b3130 | 2015-01-04 12:03:27 +0000 | [diff] [blame] | 436 | AC = &getAnalysis<AssumptionCacheTracker>().getAssumptionCache( |
| 437 | *L->getHeader()->getParent()); |
Chandler Carruth | 4f8f307 | 2015-01-17 14:16:18 +0000 | [diff] [blame] | 438 | LI = &getAnalysis<LoopInfoWrapperPass>().getLoopInfo(); |
Devang Patel | 901a27d | 2007-03-07 00:26:10 +0000 | [diff] [blame] | 439 | LPM = &LPM_Ref; |
Michael Zolotukhin | 9f3aea6 | 2015-09-22 00:22:47 +0000 | [diff] [blame] | 440 | DT = &getAnalysis<DominatorTreeWrapperPass>().getDomTree(); |
Devang Patel | e149d4e | 2008-07-02 01:18:13 +0000 | [diff] [blame] | 441 | currentLoop = L; |
Devang Patel | 40519f0 | 2008-09-04 22:43:59 +0000 | [diff] [blame] | 442 | Function *F = currentLoop->getHeader()->getParent(); |
Chen Li | 9f27fc0 | 2015-09-29 05:03:32 +0000 | [diff] [blame] | 443 | |
| 444 | EnabledPGO = F->getEntryCount().hasValue(); |
| 445 | |
| 446 | if (LoopUnswitchWithBlockFrequency && EnabledPGO) { |
| 447 | BranchProbabilityInfo BPI(*F, *LI); |
| 448 | BFI.calculate(*L->getHeader()->getParent(), BPI, *LI); |
| 449 | |
| 450 | // Use BranchProbability to compute a minimum frequency based on |
| 451 | // function entry baseline frequency. Loops with headers below this |
| 452 | // frequency are considered as cold. |
| 453 | const BranchProbability ColdProb(ColdnessThreshold, 100); |
| 454 | ColdEntryFreq = BlockFrequency(BFI.getEntryFreq()) * ColdProb; |
| 455 | } |
| 456 | |
Chris Lattner | c2e3a7a | 2006-02-18 07:57:38 +0000 | [diff] [blame] | 457 | bool Changed = false; |
Devang Patel | 7d165e1 | 2007-07-30 23:07:10 +0000 | [diff] [blame] | 458 | do { |
Michael Zolotukhin | 9f3aea6 | 2015-09-22 00:22:47 +0000 | [diff] [blame] | 459 | assert(currentLoop->isLCSSAForm(*DT)); |
Devang Patel | 7d165e1 | 2007-07-30 23:07:10 +0000 | [diff] [blame] | 460 | redoLoop = false; |
Devang Patel | e149d4e | 2008-07-02 01:18:13 +0000 | [diff] [blame] | 461 | Changed |= processCurrentLoop(); |
Devang Patel | 7d165e1 | 2007-07-30 23:07:10 +0000 | [diff] [blame] | 462 | } while(redoLoop); |
| 463 | |
Michael Zolotukhin | 9f3aea6 | 2015-09-22 00:22:47 +0000 | [diff] [blame] | 464 | // FIXME: Reconstruct dom info, because it is not preserved properly. |
| 465 | if (Changed) |
| 466 | DT->recalculate(*F); |
Devang Patel | 7d165e1 | 2007-07-30 23:07:10 +0000 | [diff] [blame] | 467 | return Changed; |
| 468 | } |
| 469 | |
Sanjay Patel | 956e29c | 2015-08-11 21:24:04 +0000 | [diff] [blame] | 470 | /// Do actual work and unswitch loop if possible and profitable. |
Devang Patel | e149d4e | 2008-07-02 01:18:13 +0000 | [diff] [blame] | 471 | bool LoopUnswitch::processCurrentLoop() { |
Devang Patel | 7d165e1 | 2007-07-30 23:07:10 +0000 | [diff] [blame] | 472 | bool Changed = false; |
Stepan Dyatkovskiy | 8216569 | 2012-01-11 08:40:51 +0000 | [diff] [blame] | 473 | |
| 474 | initLoopData(); |
Andrew Trick | 4104ed9 | 2012-04-10 05:14:37 +0000 | [diff] [blame] | 475 | |
Stepan Dyatkovskiy | 8216569 | 2012-01-11 08:40:51 +0000 | [diff] [blame] | 476 | // If LoopSimplify was unable to form a preheader, don't do any unswitching. |
| 477 | if (!loopPreheader) |
| 478 | return false; |
Andrew Trick | 4104ed9 | 2012-04-10 05:14:37 +0000 | [diff] [blame] | 479 | |
Andrew Trick | 4442bfe | 2012-04-10 05:14:42 +0000 | [diff] [blame] | 480 | // Loops with indirectbr cannot be cloned. |
| 481 | if (!currentLoop->isSafeToClone()) |
| 482 | return false; |
| 483 | |
| 484 | // Without dedicated exits, splitting the exit edge may fail. |
| 485 | if (!currentLoop->hasDedicatedExits()) |
| 486 | return false; |
| 487 | |
Stepan Dyatkovskiy | 8216569 | 2012-01-11 08:40:51 +0000 | [diff] [blame] | 488 | LLVMContext &Context = loopHeader->getContext(); |
Andrew Trick | 4104ed9 | 2012-04-10 05:14:37 +0000 | [diff] [blame] | 489 | |
Stepan Dyatkovskiy | 8216569 | 2012-01-11 08:40:51 +0000 | [diff] [blame] | 490 | // Probably we reach the quota of branches for this loop. If so |
| 491 | // stop unswitching. |
Chandler Carruth | 705b185 | 2015-01-31 03:43:40 +0000 | [diff] [blame] | 492 | if (!BranchesInfo.countLoop( |
Chandler Carruth | fdb9c57 | 2015-02-01 12:01:35 +0000 | [diff] [blame] | 493 | currentLoop, getAnalysis<TargetTransformInfoWrapperPass>().getTTI( |
| 494 | *currentLoop->getHeader()->getParent()), |
Chandler Carruth | 705b185 | 2015-01-31 03:43:40 +0000 | [diff] [blame] | 495 | AC)) |
Stepan Dyatkovskiy | 8216569 | 2012-01-11 08:40:51 +0000 | [diff] [blame] | 496 | return false; |
Devang Patel | 7d165e1 | 2007-07-30 23:07:10 +0000 | [diff] [blame] | 497 | |
Chen Li | c0f3a15 | 2015-07-22 05:26:29 +0000 | [diff] [blame] | 498 | // Try trivial unswitch first before loop over other basic blocks in the loop. |
| 499 | if (TryTrivialLoopUnswitch(Changed)) { |
| 500 | return true; |
| 501 | } |
| 502 | |
Owen Anderson | 2c9978b | 2015-10-09 18:40:20 +0000 | [diff] [blame^] | 503 | // Do not unswitch loops containing convergent operations, as we might be |
| 504 | // making them control dependent on the unswitch value when they were not |
| 505 | // before. |
| 506 | // FIXME: This could be refined to only bail if the convergent operation is |
| 507 | // not already control-dependent on the unswitch value. |
| 508 | for (const auto BB : currentLoop->blocks()) { |
| 509 | for (const auto &I : *BB) { |
| 510 | const auto CI = dyn_cast<CallInst>(&I); |
| 511 | if (!CI) continue; |
| 512 | if (CI->isConvergent()) |
| 513 | return false; |
| 514 | } |
| 515 | } |
| 516 | |
Chen Li | f458c6f | 2015-08-13 05:24:29 +0000 | [diff] [blame] | 517 | // Do not do non-trivial unswitch while optimizing for size. |
| 518 | // FIXME: Use Function::optForSize(). |
| 519 | if (OptimizeForSize || |
| 520 | loopHeader->getParent()->hasFnAttribute(Attribute::OptimizeForSize)) |
| 521 | return false; |
| 522 | |
Chen Li | 9f27fc0 | 2015-09-29 05:03:32 +0000 | [diff] [blame] | 523 | if (LoopUnswitchWithBlockFrequency && EnabledPGO) { |
| 524 | // Compute the weighted frequency of the hottest block in the |
| 525 | // loop (loopHeader in this case since inner loops should be |
| 526 | // processed before outer loop). If it is less than ColdFrequency, |
| 527 | // we should not unswitch. |
| 528 | BlockFrequency LoopEntryFreq = BFI.getBlockFreq(loopHeader); |
| 529 | if (LoopEntryFreq < ColdEntryFreq) |
| 530 | return false; |
| 531 | } |
| 532 | |
Chris Lattner | c2e3a7a | 2006-02-18 07:57:38 +0000 | [diff] [blame] | 533 | // Loop over all of the basic blocks in the loop. If we find an interior |
| 534 | // block that is branching on a loop-invariant condition, we can unswitch this |
| 535 | // loop. |
Andrew Trick | 4104ed9 | 2012-04-10 05:14:37 +0000 | [diff] [blame] | 536 | for (Loop::block_iterator I = currentLoop->block_begin(), |
Chris Lattner | c832c1b | 2010-04-05 21:18:32 +0000 | [diff] [blame] | 537 | E = currentLoop->block_end(); I != E; ++I) { |
Chris Lattner | c2e3a7a | 2006-02-18 07:57:38 +0000 | [diff] [blame] | 538 | TerminatorInst *TI = (*I)->getTerminator(); |
| 539 | if (BranchInst *BI = dyn_cast<BranchInst>(TI)) { |
| 540 | // If this isn't branching on an invariant condition, we can't unswitch |
| 541 | // it. |
| 542 | if (BI->isConditional()) { |
| 543 | // See if this, or some part of it, is loop invariant. If so, we can |
| 544 | // unswitch on it if we desire. |
Andrew Trick | 4104ed9 | 2012-04-10 05:14:37 +0000 | [diff] [blame] | 545 | Value *LoopCond = FindLIVLoopCondition(BI->getCondition(), |
Devang Patel | e149d4e | 2008-07-02 01:18:13 +0000 | [diff] [blame] | 546 | currentLoop, Changed); |
Weiming Zhao | f1abad5 | 2015-06-23 05:31:09 +0000 | [diff] [blame] | 547 | if (LoopCond && |
| 548 | UnswitchIfProfitable(LoopCond, ConstantInt::getTrue(Context), TI)) { |
Chris Lattner | c2e3a7a | 2006-02-18 07:57:38 +0000 | [diff] [blame] | 549 | ++NumBranches; |
| 550 | return true; |
| 551 | } |
Andrew Trick | 4104ed9 | 2012-04-10 05:14:37 +0000 | [diff] [blame] | 552 | } |
Chris Lattner | c2e3a7a | 2006-02-18 07:57:38 +0000 | [diff] [blame] | 553 | } else if (SwitchInst *SI = dyn_cast<SwitchInst>(TI)) { |
Andrew Trick | 4104ed9 | 2012-04-10 05:14:37 +0000 | [diff] [blame] | 554 | Value *LoopCond = FindLIVLoopCondition(SI->getCondition(), |
Devang Patel | e149d4e | 2008-07-02 01:18:13 +0000 | [diff] [blame] | 555 | currentLoop, Changed); |
Andrew Trick | 4104ed9 | 2012-04-10 05:14:37 +0000 | [diff] [blame] | 556 | unsigned NumCases = SI->getNumCases(); |
Stepan Dyatkovskiy | 513aaa5 | 2012-02-01 07:49:51 +0000 | [diff] [blame] | 557 | if (LoopCond && NumCases) { |
Chris Lattner | c2e3a7a | 2006-02-18 07:57:38 +0000 | [diff] [blame] | 558 | // Find a value to unswitch on: |
| 559 | // FIXME: this should chose the most expensive case! |
Nick Lewycky | 6115824 | 2011-06-03 06:27:15 +0000 | [diff] [blame] | 560 | // FIXME: scan for a case with a non-critical edge? |
Craig Topper | f40110f | 2014-04-25 05:29:35 +0000 | [diff] [blame] | 561 | Constant *UnswitchVal = nullptr; |
Andrew Trick | 4104ed9 | 2012-04-10 05:14:37 +0000 | [diff] [blame] | 562 | |
Devang Patel | 967b84c | 2007-02-26 19:31:58 +0000 | [diff] [blame] | 563 | // Do not process same value again and again. |
Chad Rosier | 3ba90a1 | 2011-12-22 21:10:46 +0000 | [diff] [blame] | 564 | // At this point we have some cases already unswitched and |
| 565 | // some not yet unswitched. Let's find the first not yet unswitched one. |
Stepan Dyatkovskiy | 97b02fc | 2012-03-11 06:09:17 +0000 | [diff] [blame] | 566 | for (SwitchInst::CaseIt i = SI->case_begin(), e = SI->case_end(); |
Stepan Dyatkovskiy | 5b648af | 2012-03-08 07:06:20 +0000 | [diff] [blame] | 567 | i != e; ++i) { |
Jakub Staszak | 27da123 | 2013-08-06 17:03:42 +0000 | [diff] [blame] | 568 | Constant *UnswitchValCandidate = i.getCaseValue(); |
Stepan Dyatkovskiy | cb2adbac | 2012-01-15 09:44:07 +0000 | [diff] [blame] | 569 | if (!BranchesInfo.isUnswitched(SI, UnswitchValCandidate)) { |
Chad Rosier | 3ba90a1 | 2011-12-22 21:10:46 +0000 | [diff] [blame] | 570 | UnswitchVal = UnswitchValCandidate; |
| 571 | break; |
| 572 | } |
| 573 | } |
Andrew Trick | 4104ed9 | 2012-04-10 05:14:37 +0000 | [diff] [blame] | 574 | |
Chad Rosier | 3ba90a1 | 2011-12-22 21:10:46 +0000 | [diff] [blame] | 575 | if (!UnswitchVal) |
Devang Patel | 967b84c | 2007-02-26 19:31:58 +0000 | [diff] [blame] | 576 | continue; |
Devang Patel | 967b84c | 2007-02-26 19:31:58 +0000 | [diff] [blame] | 577 | |
Devang Patel | e149d4e | 2008-07-02 01:18:13 +0000 | [diff] [blame] | 578 | if (UnswitchIfProfitable(LoopCond, UnswitchVal)) { |
Chris Lattner | c2e3a7a | 2006-02-18 07:57:38 +0000 | [diff] [blame] | 579 | ++NumSwitches; |
| 580 | return true; |
| 581 | } |
| 582 | } |
| 583 | } |
Andrew Trick | 4104ed9 | 2012-04-10 05:14:37 +0000 | [diff] [blame] | 584 | |
Chris Lattner | c2e3a7a | 2006-02-18 07:57:38 +0000 | [diff] [blame] | 585 | // Scan the instructions to check for unswitchable values. |
Andrew Trick | 4104ed9 | 2012-04-10 05:14:37 +0000 | [diff] [blame] | 586 | for (BasicBlock::iterator BBI = (*I)->begin(), E = (*I)->end(); |
Chris Lattner | c2e3a7a | 2006-02-18 07:57:38 +0000 | [diff] [blame] | 587 | BBI != E; ++BBI) |
| 588 | if (SelectInst *SI = dyn_cast<SelectInst>(BBI)) { |
Andrew Trick | 4104ed9 | 2012-04-10 05:14:37 +0000 | [diff] [blame] | 589 | Value *LoopCond = FindLIVLoopCondition(SI->getCondition(), |
Devang Patel | e149d4e | 2008-07-02 01:18:13 +0000 | [diff] [blame] | 590 | currentLoop, Changed); |
Andrew Trick | 4104ed9 | 2012-04-10 05:14:37 +0000 | [diff] [blame] | 591 | if (LoopCond && UnswitchIfProfitable(LoopCond, |
Owen Anderson | 23a204d | 2009-07-31 17:39:07 +0000 | [diff] [blame] | 592 | ConstantInt::getTrue(Context))) { |
Chris Lattner | c2e3a7a | 2006-02-18 07:57:38 +0000 | [diff] [blame] | 593 | ++NumSelects; |
| 594 | return true; |
| 595 | } |
| 596 | } |
| 597 | } |
Chris Lattner | f48f777 | 2004-04-19 18:07:02 +0000 | [diff] [blame] | 598 | return Changed; |
| 599 | } |
| 600 | |
Sanjay Patel | 956e29c | 2015-08-11 21:24:04 +0000 | [diff] [blame] | 601 | /// Check to see if all paths from BB exit the loop with no side effects |
| 602 | /// (including infinite loops). |
Chris Lattner | e5cb76d | 2006-02-15 22:03:36 +0000 | [diff] [blame] | 603 | /// |
Dan Gohman | 0ad7d9c | 2010-09-01 21:46:45 +0000 | [diff] [blame] | 604 | /// If true, we return true and set ExitBB to the block we |
Chris Lattner | e5cb76d | 2006-02-15 22:03:36 +0000 | [diff] [blame] | 605 | /// exit through. |
| 606 | /// |
| 607 | static bool isTrivialLoopExitBlockHelper(Loop *L, BasicBlock *BB, |
| 608 | BasicBlock *&ExitBB, |
| 609 | std::set<BasicBlock*> &Visited) { |
Chris Lattner | baddba4 | 2006-02-17 06:39:56 +0000 | [diff] [blame] | 610 | if (!Visited.insert(BB).second) { |
Nick Lewycky | d9d1de4 | 2011-12-23 23:49:25 +0000 | [diff] [blame] | 611 | // Already visited. Without more analysis, this could indicate an infinite |
| 612 | // loop. |
Dan Gohman | 0ad7d9c | 2010-09-01 21:46:45 +0000 | [diff] [blame] | 613 | return false; |
Jakub Staszak | 27da123 | 2013-08-06 17:03:42 +0000 | [diff] [blame] | 614 | } |
| 615 | if (!L->contains(BB)) { |
Chris Lattner | baddba4 | 2006-02-17 06:39:56 +0000 | [diff] [blame] | 616 | // Otherwise, this is a loop exit, this is fine so long as this is the |
| 617 | // first exit. |
Craig Topper | f40110f | 2014-04-25 05:29:35 +0000 | [diff] [blame] | 618 | if (ExitBB) return false; |
Chris Lattner | baddba4 | 2006-02-17 06:39:56 +0000 | [diff] [blame] | 619 | ExitBB = BB; |
Edward O'Callaghan | 2b8fed1 | 2009-11-25 05:38:41 +0000 | [diff] [blame] | 620 | return true; |
Chris Lattner | baddba4 | 2006-02-17 06:39:56 +0000 | [diff] [blame] | 621 | } |
Andrew Trick | 4104ed9 | 2012-04-10 05:14:37 +0000 | [diff] [blame] | 622 | |
Chris Lattner | baddba4 | 2006-02-17 06:39:56 +0000 | [diff] [blame] | 623 | // Otherwise, this is an unvisited intra-loop node. Check all successors. |
Duncan P. N. Exon Smith | 6c99015 | 2014-07-21 17:06:51 +0000 | [diff] [blame] | 624 | for (succ_iterator SI = succ_begin(BB), E = succ_end(BB); SI != E; ++SI) { |
Chris Lattner | baddba4 | 2006-02-17 06:39:56 +0000 | [diff] [blame] | 625 | // Check to see if the successor is a trivial loop exit. |
Duncan P. N. Exon Smith | 6c99015 | 2014-07-21 17:06:51 +0000 | [diff] [blame] | 626 | if (!isTrivialLoopExitBlockHelper(L, *SI, ExitBB, Visited)) |
Chris Lattner | baddba4 | 2006-02-17 06:39:56 +0000 | [diff] [blame] | 627 | return false; |
Chris Lattner | 6e26315 | 2006-02-10 02:30:37 +0000 | [diff] [blame] | 628 | } |
Chris Lattner | e5cb76d | 2006-02-15 22:03:36 +0000 | [diff] [blame] | 629 | |
| 630 | // Okay, everything after this looks good, check to make sure that this block |
| 631 | // doesn't include any side effects. |
Chris Lattner | fdff0bb | 2006-02-15 22:52:05 +0000 | [diff] [blame] | 632 | for (BasicBlock::iterator I = BB->begin(), E = BB->end(); I != E; ++I) |
Duncan Sands | 1efabaa | 2009-05-06 06:49:50 +0000 | [diff] [blame] | 633 | if (I->mayHaveSideEffects()) |
Chris Lattner | e5cb76d | 2006-02-15 22:03:36 +0000 | [diff] [blame] | 634 | return false; |
Andrew Trick | 4104ed9 | 2012-04-10 05:14:37 +0000 | [diff] [blame] | 635 | |
Chris Lattner | e5cb76d | 2006-02-15 22:03:36 +0000 | [diff] [blame] | 636 | return true; |
Chris Lattner | 6e26315 | 2006-02-10 02:30:37 +0000 | [diff] [blame] | 637 | } |
| 638 | |
Sanjay Patel | 956e29c | 2015-08-11 21:24:04 +0000 | [diff] [blame] | 639 | /// Return true if the specified block unconditionally leads to an exit from |
| 640 | /// the specified loop, and has no side-effects in the process. If so, return |
| 641 | /// the block that is exited to, otherwise return null. |
Chris Lattner | e5cb76d | 2006-02-15 22:03:36 +0000 | [diff] [blame] | 642 | static BasicBlock *isTrivialLoopExitBlock(Loop *L, BasicBlock *BB) { |
| 643 | std::set<BasicBlock*> Visited; |
Dan Gohman | 0ad7d9c | 2010-09-01 21:46:45 +0000 | [diff] [blame] | 644 | Visited.insert(L->getHeader()); // Branches to header make infinite loops. |
Craig Topper | f40110f | 2014-04-25 05:29:35 +0000 | [diff] [blame] | 645 | BasicBlock *ExitBB = nullptr; |
Chris Lattner | e5cb76d | 2006-02-15 22:03:36 +0000 | [diff] [blame] | 646 | if (isTrivialLoopExitBlockHelper(L, BB, ExitBB, Visited)) |
| 647 | return ExitBB; |
Craig Topper | f40110f | 2014-04-25 05:29:35 +0000 | [diff] [blame] | 648 | return nullptr; |
Chris Lattner | e5cb76d | 2006-02-15 22:03:36 +0000 | [diff] [blame] | 649 | } |
Chris Lattner | 6e26315 | 2006-02-10 02:30:37 +0000 | [diff] [blame] | 650 | |
Sanjay Patel | 956e29c | 2015-08-11 21:24:04 +0000 | [diff] [blame] | 651 | /// We have found that we can unswitch currentLoop when LoopCond == Val to |
| 652 | /// simplify the loop. If we decide that this is profitable, |
Chris Lattner | fbadd7e | 2006-02-11 00:43:37 +0000 | [diff] [blame] | 653 | /// unswitch the loop, reprocess the pieces, then return true. |
Weiming Zhao | f1abad5 | 2015-06-23 05:31:09 +0000 | [diff] [blame] | 654 | bool LoopUnswitch::UnswitchIfProfitable(Value *LoopCond, Constant *Val, |
| 655 | TerminatorInst *TI) { |
Evan Cheng | ed66db3 | 2010-04-03 02:23:43 +0000 | [diff] [blame] | 656 | // Check to see if it would be profitable to unswitch current loop. |
Mark Heffernan | 9b536a6 | 2015-06-23 18:26:50 +0000 | [diff] [blame] | 657 | if (!BranchesInfo.CostAllowsUnswitching()) { |
| 658 | DEBUG(dbgs() << "NOT unswitching loop %" |
| 659 | << currentLoop->getHeader()->getName() |
| 660 | << " at non-trivial condition '" << *Val |
| 661 | << "' == " << *LoopCond << "\n" |
| 662 | << ". Cost too high.\n"); |
| 663 | return false; |
| 664 | } |
Evan Cheng | ed66db3 | 2010-04-03 02:23:43 +0000 | [diff] [blame] | 665 | |
Weiming Zhao | f1abad5 | 2015-06-23 05:31:09 +0000 | [diff] [blame] | 666 | UnswitchNontrivialCondition(LoopCond, Val, currentLoop, TI); |
Andrew Trick | 4442bfe | 2012-04-10 05:14:42 +0000 | [diff] [blame] | 667 | return true; |
Chris Lattner | fbadd7e | 2006-02-11 00:43:37 +0000 | [diff] [blame] | 668 | } |
| 669 | |
Sanjay Patel | 956e29c | 2015-08-11 21:24:04 +0000 | [diff] [blame] | 670 | /// Recursively clone the specified loop and all of its children, |
Chris Lattner | f48f777 | 2004-04-19 18:07:02 +0000 | [diff] [blame] | 671 | /// mapping the blocks with the specified map. |
Rafael Espindola | 229e38f | 2010-10-13 01:36:30 +0000 | [diff] [blame] | 672 | static Loop *CloneLoop(Loop *L, Loop *PL, ValueToValueMapTy &VM, |
Devang Patel | 901a27d | 2007-03-07 00:26:10 +0000 | [diff] [blame] | 673 | LoopInfo *LI, LPPassManager *LPM) { |
Chris Lattner | f48f777 | 2004-04-19 18:07:02 +0000 | [diff] [blame] | 674 | Loop *New = new Loop(); |
Devang Patel | 901a27d | 2007-03-07 00:26:10 +0000 | [diff] [blame] | 675 | LPM->insertLoop(New, PL); |
Chris Lattner | f48f777 | 2004-04-19 18:07:02 +0000 | [diff] [blame] | 676 | |
| 677 | // Add all of the blocks in L to the new loop. |
| 678 | for (Loop::block_iterator I = L->block_begin(), E = L->block_end(); |
| 679 | I != E; ++I) |
| 680 | if (LI->getLoopFor(*I) == L) |
Chandler Carruth | 691addc | 2015-01-18 01:25:51 +0000 | [diff] [blame] | 681 | New->addBasicBlockToLoop(cast<BasicBlock>(VM[*I]), *LI); |
Chris Lattner | f48f777 | 2004-04-19 18:07:02 +0000 | [diff] [blame] | 682 | |
| 683 | // Add all of the subloops to the new loop. |
| 684 | for (Loop::iterator I = L->begin(), E = L->end(); I != E; ++I) |
Devang Patel | 901a27d | 2007-03-07 00:26:10 +0000 | [diff] [blame] | 685 | CloneLoop(*I, New, VM, LI, LPM); |
Misha Brukman | b1c9317 | 2005-04-21 23:48:37 +0000 | [diff] [blame] | 686 | |
Chris Lattner | f48f777 | 2004-04-19 18:07:02 +0000 | [diff] [blame] | 687 | return New; |
| 688 | } |
| 689 | |
Weiming Zhao | f1abad5 | 2015-06-23 05:31:09 +0000 | [diff] [blame] | 690 | static void copyMetadata(Instruction *DstInst, const Instruction *SrcInst, |
| 691 | bool Swapped) { |
| 692 | if (!SrcInst || !SrcInst->hasMetadata()) |
| 693 | return; |
| 694 | |
| 695 | SmallVector<std::pair<unsigned, MDNode *>, 4> MDs; |
| 696 | SrcInst->getAllMetadata(MDs); |
| 697 | for (auto &MD : MDs) { |
| 698 | switch (MD.first) { |
| 699 | default: |
| 700 | break; |
| 701 | case LLVMContext::MD_prof: |
| 702 | if (Swapped && MD.second->getNumOperands() == 3 && |
| 703 | isa<MDString>(MD.second->getOperand(0))) { |
| 704 | MDString *MDName = cast<MDString>(MD.second->getOperand(0)); |
| 705 | if (MDName->getString() == "branch_weights") { |
| 706 | auto *ValT = cast_or_null<ConstantAsMetadata>( |
| 707 | MD.second->getOperand(1))->getValue(); |
| 708 | auto *ValF = cast_or_null<ConstantAsMetadata>( |
| 709 | MD.second->getOperand(2))->getValue(); |
| 710 | assert(ValT && ValF && "Invalid Operands of branch_weights"); |
| 711 | auto NewMD = |
| 712 | MDBuilder(DstInst->getParent()->getContext()) |
| 713 | .createBranchWeights(cast<ConstantInt>(ValF)->getZExtValue(), |
| 714 | cast<ConstantInt>(ValT)->getZExtValue()); |
| 715 | MD.second = NewMD; |
| 716 | } |
| 717 | } |
| 718 | // fallthrough. |
Chen Li | 50efd92 | 2015-08-05 21:13:26 +0000 | [diff] [blame] | 719 | case LLVMContext::MD_make_implicit: |
Weiming Zhao | f1abad5 | 2015-06-23 05:31:09 +0000 | [diff] [blame] | 720 | case LLVMContext::MD_dbg: |
| 721 | DstInst->setMetadata(MD.first, MD.second); |
| 722 | } |
| 723 | } |
| 724 | } |
| 725 | |
Sanjay Patel | 956e29c | 2015-08-11 21:24:04 +0000 | [diff] [blame] | 726 | /// Emit a conditional branch on two values if LIC == Val, branch to TrueDst, |
| 727 | /// otherwise branch to FalseDest. Insert the code immediately before InsertPt. |
Devang Patel | 3304e46 | 2007-06-28 00:49:00 +0000 | [diff] [blame] | 728 | void LoopUnswitch::EmitPreheaderBranchOnCondition(Value *LIC, Constant *Val, |
| 729 | BasicBlock *TrueDest, |
| 730 | BasicBlock *FalseDest, |
Weiming Zhao | f1abad5 | 2015-06-23 05:31:09 +0000 | [diff] [blame] | 731 | Instruction *InsertPt, |
| 732 | TerminatorInst *TI) { |
Chris Lattner | b0cbe71 | 2006-02-15 00:07:43 +0000 | [diff] [blame] | 733 | // Insert a conditional branch on LIC to the two preheaders. The original |
| 734 | // code is the true version and the new code is the false version. |
| 735 | Value *BranchVal = LIC; |
Weiming Zhao | f1abad5 | 2015-06-23 05:31:09 +0000 | [diff] [blame] | 736 | bool Swapped = false; |
Owen Anderson | 55f1c09 | 2009-08-13 21:58:54 +0000 | [diff] [blame] | 737 | if (!isa<ConstantInt>(Val) || |
| 738 | Val->getType() != Type::getInt1Ty(LIC->getContext())) |
Benjamin Kramer | 547b6c5 | 2011-09-27 20:39:19 +0000 | [diff] [blame] | 739 | BranchVal = new ICmpInst(InsertPt, ICmpInst::ICMP_EQ, LIC, Val); |
Weiming Zhao | f1abad5 | 2015-06-23 05:31:09 +0000 | [diff] [blame] | 740 | else if (Val != ConstantInt::getTrue(Val->getContext())) { |
Chris Lattner | b0cbe71 | 2006-02-15 00:07:43 +0000 | [diff] [blame] | 741 | // We want to enter the new loop when the condition is true. |
| 742 | std::swap(TrueDest, FalseDest); |
Weiming Zhao | f1abad5 | 2015-06-23 05:31:09 +0000 | [diff] [blame] | 743 | Swapped = true; |
| 744 | } |
Chris Lattner | b0cbe71 | 2006-02-15 00:07:43 +0000 | [diff] [blame] | 745 | |
| 746 | // Insert the new branch. |
Dan Gohman | 3ddbc24 | 2009-09-08 15:45:00 +0000 | [diff] [blame] | 747 | BranchInst *BI = BranchInst::Create(TrueDest, FalseDest, BranchVal, InsertPt); |
Weiming Zhao | f1abad5 | 2015-06-23 05:31:09 +0000 | [diff] [blame] | 748 | copyMetadata(BI, TI, Swapped); |
Dan Gohman | 3ddbc24 | 2009-09-08 15:45:00 +0000 | [diff] [blame] | 749 | |
| 750 | // If either edge is critical, split it. This helps preserve LoopSimplify |
| 751 | // form for enclosing loops. |
Chandler Carruth | f8753fc | 2015-01-19 12:12:00 +0000 | [diff] [blame] | 752 | auto Options = CriticalEdgeSplittingOptions(DT, LI).setPreserveLCSSA(); |
Chandler Carruth | 37df2cf | 2015-01-19 12:09:11 +0000 | [diff] [blame] | 753 | SplitCriticalEdge(BI, 0, Options); |
| 754 | SplitCriticalEdge(BI, 1, Options); |
Chris Lattner | b0cbe71 | 2006-02-15 00:07:43 +0000 | [diff] [blame] | 755 | } |
| 756 | |
Sanjay Patel | 956e29c | 2015-08-11 21:24:04 +0000 | [diff] [blame] | 757 | /// Given a loop that has a trivial unswitchable condition in it (a cond branch |
| 758 | /// from its header block to its latch block, where the path through the loop |
| 759 | /// that doesn't execute its body has no side-effects), unswitch it. This |
| 760 | /// doesn't involve any code duplication, just moving the conditional branch |
| 761 | /// outside of the loop and updating loop info. |
Weiming Zhao | f1abad5 | 2015-06-23 05:31:09 +0000 | [diff] [blame] | 762 | void LoopUnswitch::UnswitchTrivialCondition(Loop *L, Value *Cond, Constant *Val, |
| 763 | BasicBlock *ExitBlock, |
| 764 | TerminatorInst *TI) { |
David Greene | d9c355d | 2010-01-05 01:27:04 +0000 | [diff] [blame] | 765 | DEBUG(dbgs() << "loop-unswitch: Trivial-Unswitch loop %" |
Weiming Zhao | f1abad5 | 2015-06-23 05:31:09 +0000 | [diff] [blame] | 766 | << loopHeader->getName() << " [" << L->getBlocks().size() |
| 767 | << " blocks] in Function " |
| 768 | << L->getHeader()->getParent()->getName() << " on cond: " << *Val |
| 769 | << " == " << *Cond << "\n"); |
Andrew Trick | 4104ed9 | 2012-04-10 05:14:37 +0000 | [diff] [blame] | 770 | |
Chris Lattner | fe4151e | 2006-02-10 23:16:39 +0000 | [diff] [blame] | 771 | // First step, split the preheader, so that we know that there is a safe place |
Devang Patel | e149d4e | 2008-07-02 01:18:13 +0000 | [diff] [blame] | 772 | // to insert the conditional branch. We will change loopPreheader to have a |
Chris Lattner | ed7a67b | 2006-02-10 01:24:09 +0000 | [diff] [blame] | 773 | // conditional branch on Cond. |
Chandler Carruth | d450056 | 2015-01-19 12:36:53 +0000 | [diff] [blame] | 774 | BasicBlock *NewPH = SplitEdge(loopPreheader, loopHeader, DT, LI); |
Chris Lattner | ed7a67b | 2006-02-10 01:24:09 +0000 | [diff] [blame] | 775 | |
| 776 | // Now that we have a place to insert the conditional branch, create a place |
Chris Lattner | 4935417 | 2006-02-10 02:01:22 +0000 | [diff] [blame] | 777 | // to branch to: this is the exit block out of the loop that we should |
| 778 | // short-circuit to. |
Andrew Trick | 4104ed9 | 2012-04-10 05:14:37 +0000 | [diff] [blame] | 779 | |
Chris Lattner | e5cb76d | 2006-02-15 22:03:36 +0000 | [diff] [blame] | 780 | // Split this block now, so that the loop maintains its exit block, and so |
| 781 | // that the jump from the preheader can execute the contents of the exit block |
| 782 | // without actually branching to it (the exit block should be dominated by the |
| 783 | // loop header, not the preheader). |
Chris Lattner | 4935417 | 2006-02-10 02:01:22 +0000 | [diff] [blame] | 784 | assert(!L->contains(ExitBlock) && "Exit block is in the loop?"); |
Chandler Carruth | 32c52c7 | 2015-01-18 02:39:37 +0000 | [diff] [blame] | 785 | BasicBlock *NewExit = SplitBlock(ExitBlock, ExitBlock->begin(), DT, LI); |
Andrew Trick | 4104ed9 | 2012-04-10 05:14:37 +0000 | [diff] [blame] | 786 | |
| 787 | // Okay, now we have a position to branch from and a position to branch to, |
Chris Lattner | ed7a67b | 2006-02-10 01:24:09 +0000 | [diff] [blame] | 788 | // insert the new conditional branch. |
Andrew Trick | 4104ed9 | 2012-04-10 05:14:37 +0000 | [diff] [blame] | 789 | EmitPreheaderBranchOnCondition(Cond, Val, NewExit, NewPH, |
Weiming Zhao | f1abad5 | 2015-06-23 05:31:09 +0000 | [diff] [blame] | 790 | loopPreheader->getTerminator(), TI); |
Devang Patel | e149d4e | 2008-07-02 01:18:13 +0000 | [diff] [blame] | 791 | LPM->deleteSimpleAnalysisValue(loopPreheader->getTerminator(), L); |
| 792 | loopPreheader->getTerminator()->eraseFromParent(); |
Chris Lattner | ed7a67b | 2006-02-10 01:24:09 +0000 | [diff] [blame] | 793 | |
Chris Lattner | c2e3a7a | 2006-02-18 07:57:38 +0000 | [diff] [blame] | 794 | // We need to reprocess this loop, it could be unswitched again. |
Devang Patel | 7d165e1 | 2007-07-30 23:07:10 +0000 | [diff] [blame] | 795 | redoLoop = true; |
Andrew Trick | 4104ed9 | 2012-04-10 05:14:37 +0000 | [diff] [blame] | 796 | |
Chris Lattner | ed7a67b | 2006-02-10 01:24:09 +0000 | [diff] [blame] | 797 | // Now that we know that the loop is never entered when this condition is a |
| 798 | // particular value, rewrite the loop with this info. We know that this will |
| 799 | // at least eliminate the old branch. |
Chris Lattner | 8a5a324 | 2006-02-22 06:37:14 +0000 | [diff] [blame] | 800 | RewriteLoopBodyWithConditionConstant(L, Cond, Val, false); |
Chris Lattner | 0b8ec1a | 2006-02-14 01:01:41 +0000 | [diff] [blame] | 801 | ++NumTrivial; |
Chris Lattner | ed7a67b | 2006-02-10 01:24:09 +0000 | [diff] [blame] | 802 | } |
| 803 | |
Sanjay Patel | 41f3d95 | 2015-08-11 21:11:56 +0000 | [diff] [blame] | 804 | /// Check if the first non-constant condition starting from the loop header is |
| 805 | /// a trivial unswitch condition: that is, a condition controls whether or not |
| 806 | /// the loop does anything at all. If it is a trivial condition, unswitching |
| 807 | /// produces no code duplications (equivalently, it produces a simpler loop and |
| 808 | /// a new empty loop, which gets deleted). Therefore always unswitch trivial |
| 809 | /// condition. |
Chen Li | c0f3a15 | 2015-07-22 05:26:29 +0000 | [diff] [blame] | 810 | bool LoopUnswitch::TryTrivialLoopUnswitch(bool &Changed) { |
Chen Li | 145c2f5 | 2015-07-25 03:21:06 +0000 | [diff] [blame] | 811 | BasicBlock *CurrentBB = currentLoop->getHeader(); |
| 812 | TerminatorInst *CurrentTerm = CurrentBB->getTerminator(); |
| 813 | LLVMContext &Context = CurrentBB->getContext(); |
Chen Li | c0f3a15 | 2015-07-22 05:26:29 +0000 | [diff] [blame] | 814 | |
Chen Li | 145c2f5 | 2015-07-25 03:21:06 +0000 | [diff] [blame] | 815 | // If loop header has only one reachable successor (currently via an |
| 816 | // unconditional branch or constant foldable conditional branch, but |
| 817 | // should also consider adding constant foldable switch instruction in |
| 818 | // future), we should keep looking for trivial condition candidates in |
| 819 | // the successor as well. An alternative is to constant fold conditions |
| 820 | // and merge successors into loop header (then we only need to check header's |
| 821 | // terminator). The reason for not doing this in LoopUnswitch pass is that |
| 822 | // it could potentially break LoopPassManager's invariants. Folding dead |
| 823 | // branches could either eliminate the current loop or make other loops |
Sanjay Patel | 41f3d95 | 2015-08-11 21:11:56 +0000 | [diff] [blame] | 824 | // unreachable. LCSSA form might also not be preserved after deleting |
| 825 | // branches. The following code keeps traversing loop header's successors |
| 826 | // until it finds the trivial condition candidate (condition that is not a |
| 827 | // constant). Since unswitching generates branches with constant conditions, |
| 828 | // this scenario could be very common in practice. |
Chen Li | 145c2f5 | 2015-07-25 03:21:06 +0000 | [diff] [blame] | 829 | SmallSet<BasicBlock*, 8> Visited; |
| 830 | |
| 831 | while (true) { |
| 832 | // If we exit loop or reach a previous visited block, then |
| 833 | // we can not reach any trivial condition candidates (unfoldable |
| 834 | // branch instructions or switch instructions) and no unswitch |
| 835 | // can happen. Exit and return false. |
| 836 | if (!currentLoop->contains(CurrentBB) || !Visited.insert(CurrentBB).second) |
Chen Li | c0f3a15 | 2015-07-22 05:26:29 +0000 | [diff] [blame] | 837 | return false; |
| 838 | |
Chen Li | 145c2f5 | 2015-07-25 03:21:06 +0000 | [diff] [blame] | 839 | // Check if this loop will execute any side-effecting instructions (e.g. |
| 840 | // stores, calls, volatile loads) in the part of the loop that the code |
| 841 | // *would* execute. Check the header first. |
| 842 | for (BasicBlock::iterator I : *CurrentBB) |
| 843 | if (I->mayHaveSideEffects()) |
| 844 | return false; |
| 845 | |
| 846 | // FIXME: add check for constant foldable switch instructions. |
| 847 | if (BranchInst *BI = dyn_cast<BranchInst>(CurrentTerm)) { |
| 848 | if (BI->isUnconditional()) { |
| 849 | CurrentBB = BI->getSuccessor(0); |
| 850 | } else if (BI->getCondition() == ConstantInt::getTrue(Context)) { |
| 851 | CurrentBB = BI->getSuccessor(0); |
| 852 | } else if (BI->getCondition() == ConstantInt::getFalse(Context)) { |
| 853 | CurrentBB = BI->getSuccessor(1); |
| 854 | } else { |
Sanjay Patel | 41f3d95 | 2015-08-11 21:11:56 +0000 | [diff] [blame] | 855 | // Found a trivial condition candidate: non-foldable conditional branch. |
Chen Li | 145c2f5 | 2015-07-25 03:21:06 +0000 | [diff] [blame] | 856 | break; |
| 857 | } |
| 858 | } else { |
| 859 | break; |
| 860 | } |
| 861 | |
| 862 | CurrentTerm = CurrentBB->getTerminator(); |
| 863 | } |
| 864 | |
Chen Li | c0f3a15 | 2015-07-22 05:26:29 +0000 | [diff] [blame] | 865 | // CondVal is the condition that controls the trivial condition. |
| 866 | // LoopExitBB is the BasicBlock that loop exits when meets trivial condition. |
| 867 | Constant *CondVal = nullptr; |
| 868 | BasicBlock *LoopExitBB = nullptr; |
| 869 | |
Chen Li | 145c2f5 | 2015-07-25 03:21:06 +0000 | [diff] [blame] | 870 | if (BranchInst *BI = dyn_cast<BranchInst>(CurrentTerm)) { |
Chen Li | c0f3a15 | 2015-07-22 05:26:29 +0000 | [diff] [blame] | 871 | // If this isn't branching on an invariant condition, we can't unswitch it. |
| 872 | if (!BI->isConditional()) |
| 873 | return false; |
| 874 | |
| 875 | Value *LoopCond = FindLIVLoopCondition(BI->getCondition(), |
| 876 | currentLoop, Changed); |
| 877 | |
| 878 | // Unswitch only if the trivial condition itself is an LIV (not |
| 879 | // partial LIV which could occur in and/or) |
| 880 | if (!LoopCond || LoopCond != BI->getCondition()) |
| 881 | return false; |
| 882 | |
| 883 | // Check to see if a successor of the branch is guaranteed to |
| 884 | // exit through a unique exit block without having any |
| 885 | // side-effects. If so, determine the value of Cond that causes |
| 886 | // it to do this. |
| 887 | if ((LoopExitBB = isTrivialLoopExitBlock(currentLoop, |
| 888 | BI->getSuccessor(0)))) { |
| 889 | CondVal = ConstantInt::getTrue(Context); |
| 890 | } else if ((LoopExitBB = isTrivialLoopExitBlock(currentLoop, |
| 891 | BI->getSuccessor(1)))) { |
| 892 | CondVal = ConstantInt::getFalse(Context); |
| 893 | } |
| 894 | |
Sanjay Patel | 41f3d95 | 2015-08-11 21:11:56 +0000 | [diff] [blame] | 895 | // If we didn't find a single unique LoopExit block, or if the loop exit |
| 896 | // block contains phi nodes, this isn't trivial. |
Chen Li | c0f3a15 | 2015-07-22 05:26:29 +0000 | [diff] [blame] | 897 | if (!LoopExitBB || isa<PHINode>(LoopExitBB->begin())) |
| 898 | return false; // Can't handle this. |
| 899 | |
Sanjay Patel | 41f3d95 | 2015-08-11 21:11:56 +0000 | [diff] [blame] | 900 | UnswitchTrivialCondition(currentLoop, LoopCond, CondVal, LoopExitBB, |
| 901 | CurrentTerm); |
Chen Li | c0f3a15 | 2015-07-22 05:26:29 +0000 | [diff] [blame] | 902 | ++NumBranches; |
| 903 | return true; |
Chen Li | 145c2f5 | 2015-07-25 03:21:06 +0000 | [diff] [blame] | 904 | } else if (SwitchInst *SI = dyn_cast<SwitchInst>(CurrentTerm)) { |
Chen Li | c0f3a15 | 2015-07-22 05:26:29 +0000 | [diff] [blame] | 905 | // If this isn't switching on an invariant condition, we can't unswitch it. |
| 906 | Value *LoopCond = FindLIVLoopCondition(SI->getCondition(), |
| 907 | currentLoop, Changed); |
| 908 | |
| 909 | // Unswitch only if the trivial condition itself is an LIV (not |
| 910 | // partial LIV which could occur in and/or) |
| 911 | if (!LoopCond || LoopCond != SI->getCondition()) |
| 912 | return false; |
| 913 | |
| 914 | // Check to see if a successor of the switch is guaranteed to go to the |
| 915 | // latch block or exit through a one exit block without having any |
| 916 | // side-effects. If so, determine the value of Cond that causes it to do |
| 917 | // this. |
| 918 | // Note that we can't trivially unswitch on the default case or |
| 919 | // on already unswitched cases. |
| 920 | for (SwitchInst::CaseIt i = SI->case_begin(), e = SI->case_end(); |
| 921 | i != e; ++i) { |
| 922 | BasicBlock *LoopExitCandidate; |
| 923 | if ((LoopExitCandidate = isTrivialLoopExitBlock(currentLoop, |
| 924 | i.getCaseSuccessor()))) { |
| 925 | // Okay, we found a trivial case, remember the value that is trivial. |
| 926 | ConstantInt *CaseVal = i.getCaseValue(); |
| 927 | |
| 928 | // Check that it was not unswitched before, since already unswitched |
| 929 | // trivial vals are looks trivial too. |
| 930 | if (BranchesInfo.isUnswitched(SI, CaseVal)) |
| 931 | continue; |
| 932 | LoopExitBB = LoopExitCandidate; |
| 933 | CondVal = CaseVal; |
| 934 | break; |
| 935 | } |
| 936 | } |
| 937 | |
Sanjay Patel | 41f3d95 | 2015-08-11 21:11:56 +0000 | [diff] [blame] | 938 | // If we didn't find a single unique LoopExit block, or if the loop exit |
| 939 | // block contains phi nodes, this isn't trivial. |
Chen Li | c0f3a15 | 2015-07-22 05:26:29 +0000 | [diff] [blame] | 940 | if (!LoopExitBB || isa<PHINode>(LoopExitBB->begin())) |
| 941 | return false; // Can't handle this. |
| 942 | |
Sanjay Patel | 41f3d95 | 2015-08-11 21:11:56 +0000 | [diff] [blame] | 943 | UnswitchTrivialCondition(currentLoop, LoopCond, CondVal, LoopExitBB, |
| 944 | nullptr); |
Chen Li | c0f3a15 | 2015-07-22 05:26:29 +0000 | [diff] [blame] | 945 | ++NumSwitches; |
| 946 | return true; |
| 947 | } |
| 948 | return false; |
| 949 | } |
| 950 | |
Sanjay Patel | 956e29c | 2015-08-11 21:24:04 +0000 | [diff] [blame] | 951 | /// Split all of the edges from inside the loop to their exit blocks. |
| 952 | /// Update the appropriate Phi nodes as we do so. |
Andrew Trick | 4104ed9 | 2012-04-10 05:14:37 +0000 | [diff] [blame] | 953 | void LoopUnswitch::SplitExitEdges(Loop *L, |
Craig Topper | b94011f | 2013-07-14 04:42:23 +0000 | [diff] [blame] | 954 | const SmallVectorImpl<BasicBlock *> &ExitBlocks){ |
Devang Patel | a69f987 | 2007-10-05 22:29:34 +0000 | [diff] [blame] | 955 | |
Chris Lattner | ed7a67b | 2006-02-10 01:24:09 +0000 | [diff] [blame] | 956 | for (unsigned i = 0, e = ExitBlocks.size(); i != e; ++i) { |
Chris Lattner | fe4151e | 2006-02-10 23:16:39 +0000 | [diff] [blame] | 957 | BasicBlock *ExitBlock = ExitBlocks[i]; |
Dan Gohman | 3ddbc24 | 2009-09-08 15:45:00 +0000 | [diff] [blame] | 958 | SmallVector<BasicBlock *, 4> Preds(pred_begin(ExitBlock), |
| 959 | pred_end(ExitBlock)); |
Bill Wendling | 90f90da | 2011-09-27 00:59:31 +0000 | [diff] [blame] | 960 | |
Nick Lewycky | 6115824 | 2011-06-03 06:27:15 +0000 | [diff] [blame] | 961 | // Although SplitBlockPredecessors doesn't preserve loop-simplify in |
| 962 | // general, if we call it on all predecessors of all exits then it does. |
Chandler Carruth | 96ada25 | 2015-07-22 09:52:54 +0000 | [diff] [blame] | 963 | SplitBlockPredecessors(ExitBlock, Preds, ".us-lcssa", DT, LI, |
Philip Reames | 9198b33 | 2015-01-28 23:06:47 +0000 | [diff] [blame] | 964 | /*PreserveLCSSA*/ true); |
Chris Lattner | ed7a67b | 2006-02-10 01:24:09 +0000 | [diff] [blame] | 965 | } |
Devang Patel | e192e325 | 2007-10-03 21:16:08 +0000 | [diff] [blame] | 966 | } |
| 967 | |
Sanjay Patel | 956e29c | 2015-08-11 21:24:04 +0000 | [diff] [blame] | 968 | /// We determined that the loop is profitable to unswitch when LIC equal Val. |
| 969 | /// Split it into loop versions and test the condition outside of either loop. |
| 970 | /// Return the loops created as Out1/Out2. |
Andrew Trick | 4442bfe | 2012-04-10 05:14:42 +0000 | [diff] [blame] | 971 | void LoopUnswitch::UnswitchNontrivialCondition(Value *LIC, Constant *Val, |
Weiming Zhao | f1abad5 | 2015-06-23 05:31:09 +0000 | [diff] [blame] | 972 | Loop *L, TerminatorInst *TI) { |
Devang Patel | e149d4e | 2008-07-02 01:18:13 +0000 | [diff] [blame] | 973 | Function *F = loopHeader->getParent(); |
David Greene | d9c355d | 2010-01-05 01:27:04 +0000 | [diff] [blame] | 974 | DEBUG(dbgs() << "loop-unswitch: Unswitching loop %" |
Daniel Dunbar | 0dd5e1e | 2009-07-25 00:23:56 +0000 | [diff] [blame] | 975 | << loopHeader->getName() << " [" << L->getBlocks().size() |
| 976 | << " blocks] in Function " << F->getName() |
| 977 | << " when '" << *Val << "' == " << *LIC << "\n"); |
Devang Patel | e192e325 | 2007-10-03 21:16:08 +0000 | [diff] [blame] | 978 | |
Chandler Carruth | 2f1fd16 | 2015-08-17 02:08:17 +0000 | [diff] [blame] | 979 | if (auto *SEWP = getAnalysisIfAvailable<ScalarEvolutionWrapperPass>()) |
| 980 | SEWP->getSE().forgetLoop(L); |
Cameron Zwarich | 99de19b | 2011-02-11 06:08:28 +0000 | [diff] [blame] | 981 | |
Devang Patel | ed50fb5 | 2008-07-02 01:44:29 +0000 | [diff] [blame] | 982 | LoopBlocks.clear(); |
| 983 | NewBlocks.clear(); |
Devang Patel | e192e325 | 2007-10-03 21:16:08 +0000 | [diff] [blame] | 984 | |
| 985 | // First step, split the preheader and exit blocks, and add these blocks to |
| 986 | // the LoopBlocks list. |
Chandler Carruth | d450056 | 2015-01-19 12:36:53 +0000 | [diff] [blame] | 987 | BasicBlock *NewPreheader = SplitEdge(loopPreheader, loopHeader, DT, LI); |
Devang Patel | e192e325 | 2007-10-03 21:16:08 +0000 | [diff] [blame] | 988 | LoopBlocks.push_back(NewPreheader); |
| 989 | |
| 990 | // We want the loop to come after the preheader, but before the exit blocks. |
| 991 | LoopBlocks.insert(LoopBlocks.end(), L->block_begin(), L->block_end()); |
| 992 | |
| 993 | SmallVector<BasicBlock*, 8> ExitBlocks; |
| 994 | L->getUniqueExitBlocks(ExitBlocks); |
| 995 | |
| 996 | // Split all of the edges from inside the loop to their exit blocks. Update |
| 997 | // the appropriate Phi nodes as we do so. |
Devang Patel | eb611dd | 2008-07-03 17:37:52 +0000 | [diff] [blame] | 998 | SplitExitEdges(L, ExitBlocks); |
Devang Patel | e192e325 | 2007-10-03 21:16:08 +0000 | [diff] [blame] | 999 | |
Chris Lattner | fe4151e | 2006-02-10 23:16:39 +0000 | [diff] [blame] | 1000 | // The exit blocks may have been changed due to edge splitting, recompute. |
| 1001 | ExitBlocks.clear(); |
Devang Patel | f489d0f | 2006-08-29 22:29:16 +0000 | [diff] [blame] | 1002 | L->getUniqueExitBlocks(ExitBlocks); |
| 1003 | |
Chris Lattner | fe4151e | 2006-02-10 23:16:39 +0000 | [diff] [blame] | 1004 | // Add exit blocks to the loop blocks. |
| 1005 | LoopBlocks.insert(LoopBlocks.end(), ExitBlocks.begin(), ExitBlocks.end()); |
Chris Lattner | f48f777 | 2004-04-19 18:07:02 +0000 | [diff] [blame] | 1006 | |
| 1007 | // Next step, clone all of the basic blocks that make up the loop (including |
| 1008 | // the loop preheader and exit blocks), keeping track of the mapping between |
| 1009 | // the instructions and blocks. |
Chris Lattner | f48f777 | 2004-04-19 18:07:02 +0000 | [diff] [blame] | 1010 | NewBlocks.reserve(LoopBlocks.size()); |
Rafael Espindola | 229e38f | 2010-10-13 01:36:30 +0000 | [diff] [blame] | 1011 | ValueToValueMapTy VMap; |
Chris Lattner | f48f777 | 2004-04-19 18:07:02 +0000 | [diff] [blame] | 1012 | for (unsigned i = 0, e = LoopBlocks.size(); i != e; ++i) { |
Devang Patel | 0dc3c2d | 2010-06-24 00:33:28 +0000 | [diff] [blame] | 1013 | BasicBlock *NewBB = CloneBasicBlock(LoopBlocks[i], VMap, ".us", F); |
Andrew Trick | 4104ed9 | 2012-04-10 05:14:37 +0000 | [diff] [blame] | 1014 | |
Evan Cheng | ba93044 | 2010-04-05 21:16:25 +0000 | [diff] [blame] | 1015 | NewBlocks.push_back(NewBB); |
Devang Patel | 0dc3c2d | 2010-06-24 00:33:28 +0000 | [diff] [blame] | 1016 | VMap[LoopBlocks[i]] = NewBB; // Keep the BB mapping. |
Evan Cheng | ba93044 | 2010-04-05 21:16:25 +0000 | [diff] [blame] | 1017 | LPM->cloneBasicBlockSimpleAnalysis(LoopBlocks[i], NewBB, L); |
Chris Lattner | f48f777 | 2004-04-19 18:07:02 +0000 | [diff] [blame] | 1018 | } |
| 1019 | |
| 1020 | // Splice the newly inserted blocks into the function right before the |
| 1021 | // original preheader. |
Evan Cheng | ba93044 | 2010-04-05 21:16:25 +0000 | [diff] [blame] | 1022 | F->getBasicBlockList().splice(NewPreheader, F->getBasicBlockList(), |
Chris Lattner | f48f777 | 2004-04-19 18:07:02 +0000 | [diff] [blame] | 1023 | NewBlocks[0], F->end()); |
| 1024 | |
Hal Finkel | 74c2f35 | 2014-09-07 12:44:26 +0000 | [diff] [blame] | 1025 | // FIXME: We could register any cloned assumptions instead of clearing the |
| 1026 | // whole function's cache. |
Chandler Carruth | 66b3130 | 2015-01-04 12:03:27 +0000 | [diff] [blame] | 1027 | AC->clear(); |
Hal Finkel | 74c2f35 | 2014-09-07 12:44:26 +0000 | [diff] [blame] | 1028 | |
Chris Lattner | f48f777 | 2004-04-19 18:07:02 +0000 | [diff] [blame] | 1029 | // Now we create the new Loop object for the versioned loop. |
Devang Patel | 0dc3c2d | 2010-06-24 00:33:28 +0000 | [diff] [blame] | 1030 | Loop *NewLoop = CloneLoop(L, L->getParentLoop(), VMap, LI, LPM); |
Stepan Dyatkovskiy | cb2adbac | 2012-01-15 09:44:07 +0000 | [diff] [blame] | 1031 | |
| 1032 | // Recalculate unswitching quota, inherit simplified switches info for NewBB, |
| 1033 | // Probably clone more loop-unswitch related loop properties. |
| 1034 | BranchesInfo.cloneData(NewLoop, L, VMap); |
| 1035 | |
Chris Lattner | f1b1516 | 2006-02-10 23:26:14 +0000 | [diff] [blame] | 1036 | Loop *ParentLoop = L->getParentLoop(); |
| 1037 | if (ParentLoop) { |
Chris Lattner | f48f777 | 2004-04-19 18:07:02 +0000 | [diff] [blame] | 1038 | // Make sure to add the cloned preheader and exit blocks to the parent loop |
| 1039 | // as well. |
Chandler Carruth | 691addc | 2015-01-18 01:25:51 +0000 | [diff] [blame] | 1040 | ParentLoop->addBasicBlockToLoop(NewBlocks[0], *LI); |
Chris Lattner | f1b1516 | 2006-02-10 23:26:14 +0000 | [diff] [blame] | 1041 | } |
Bill Wendling | 90f90da | 2011-09-27 00:59:31 +0000 | [diff] [blame] | 1042 | |
Chris Lattner | f1b1516 | 2006-02-10 23:26:14 +0000 | [diff] [blame] | 1043 | for (unsigned i = 0, e = ExitBlocks.size(); i != e; ++i) { |
Devang Patel | 0dc3c2d | 2010-06-24 00:33:28 +0000 | [diff] [blame] | 1044 | BasicBlock *NewExit = cast<BasicBlock>(VMap[ExitBlocks[i]]); |
Chris Lattner | 8e44ff5 | 2006-02-18 00:55:32 +0000 | [diff] [blame] | 1045 | // The new exit block should be in the same loop as the old one. |
| 1046 | if (Loop *ExitBBLoop = LI->getLoopFor(ExitBlocks[i])) |
Chandler Carruth | 691addc | 2015-01-18 01:25:51 +0000 | [diff] [blame] | 1047 | ExitBBLoop->addBasicBlockToLoop(NewExit, *LI); |
Andrew Trick | 4104ed9 | 2012-04-10 05:14:37 +0000 | [diff] [blame] | 1048 | |
Chris Lattner | f1b1516 | 2006-02-10 23:26:14 +0000 | [diff] [blame] | 1049 | assert(NewExit->getTerminator()->getNumSuccessors() == 1 && |
| 1050 | "Exit block should have been split to have one successor!"); |
| 1051 | BasicBlock *ExitSucc = NewExit->getTerminator()->getSuccessor(0); |
Devang Patel | eb611dd | 2008-07-03 17:37:52 +0000 | [diff] [blame] | 1052 | |
Chris Lattner | f1b1516 | 2006-02-10 23:26:14 +0000 | [diff] [blame] | 1053 | // If the successor of the exit block had PHI nodes, add an entry for |
| 1054 | // NewExit. |
Jakub Staszak | 27da123 | 2013-08-06 17:03:42 +0000 | [diff] [blame] | 1055 | for (BasicBlock::iterator I = ExitSucc->begin(); |
| 1056 | PHINode *PN = dyn_cast<PHINode>(I); ++I) { |
Chris Lattner | f1b1516 | 2006-02-10 23:26:14 +0000 | [diff] [blame] | 1057 | Value *V = PN->getIncomingValueForBlock(ExitBlocks[i]); |
Rafael Espindola | 229e38f | 2010-10-13 01:36:30 +0000 | [diff] [blame] | 1058 | ValueToValueMapTy::iterator It = VMap.find(V); |
Devang Patel | 0dc3c2d | 2010-06-24 00:33:28 +0000 | [diff] [blame] | 1059 | if (It != VMap.end()) V = It->second; |
Chris Lattner | f1b1516 | 2006-02-10 23:26:14 +0000 | [diff] [blame] | 1060 | PN->addIncoming(V, NewExit); |
| 1061 | } |
Bill Wendling | 90f90da | 2011-09-27 00:59:31 +0000 | [diff] [blame] | 1062 | |
| 1063 | if (LandingPadInst *LPad = NewExit->getLandingPadInst()) { |
Jakub Staszak | 27da123 | 2013-08-06 17:03:42 +0000 | [diff] [blame] | 1064 | PHINode *PN = PHINode::Create(LPad->getType(), 0, "", |
| 1065 | ExitSucc->getFirstInsertionPt()); |
Bill Wendling | 90f90da | 2011-09-27 00:59:31 +0000 | [diff] [blame] | 1066 | |
Duncan P. N. Exon Smith | 6c99015 | 2014-07-21 17:06:51 +0000 | [diff] [blame] | 1067 | for (pred_iterator I = pred_begin(ExitSucc), E = pred_end(ExitSucc); |
| 1068 | I != E; ++I) { |
| 1069 | BasicBlock *BB = *I; |
Bill Wendling | 90f90da | 2011-09-27 00:59:31 +0000 | [diff] [blame] | 1070 | LandingPadInst *LPI = BB->getLandingPadInst(); |
| 1071 | LPI->replaceAllUsesWith(PN); |
| 1072 | PN->addIncoming(LPI, BB); |
| 1073 | } |
| 1074 | } |
Chris Lattner | f48f777 | 2004-04-19 18:07:02 +0000 | [diff] [blame] | 1075 | } |
| 1076 | |
| 1077 | // Rewrite the code to refer to itself. |
Nick Lewycky | 4d43d3c | 2008-04-25 16:53:59 +0000 | [diff] [blame] | 1078 | for (unsigned i = 0, e = NewBlocks.size(); i != e; ++i) |
| 1079 | for (BasicBlock::iterator I = NewBlocks[i]->begin(), |
| 1080 | E = NewBlocks[i]->end(); I != E; ++I) |
Chris Lattner | 43f8d16 | 2011-01-08 08:15:20 +0000 | [diff] [blame] | 1081 | RemapInstruction(I, VMap,RF_NoModuleLevelChanges|RF_IgnoreMissingEntries); |
Andrew Trick | 4104ed9 | 2012-04-10 05:14:37 +0000 | [diff] [blame] | 1082 | |
Chris Lattner | f48f777 | 2004-04-19 18:07:02 +0000 | [diff] [blame] | 1083 | // Rewrite the original preheader to select between versions of the loop. |
Devang Patel | e149d4e | 2008-07-02 01:18:13 +0000 | [diff] [blame] | 1084 | BranchInst *OldBR = cast<BranchInst>(loopPreheader->getTerminator()); |
Chris Lattner | b0cbe71 | 2006-02-15 00:07:43 +0000 | [diff] [blame] | 1085 | assert(OldBR->isUnconditional() && OldBR->getSuccessor(0) == LoopBlocks[0] && |
Chris Lattner | f48f777 | 2004-04-19 18:07:02 +0000 | [diff] [blame] | 1086 | "Preheader splitting did not work correctly!"); |
Chris Lattner | f48f777 | 2004-04-19 18:07:02 +0000 | [diff] [blame] | 1087 | |
Chris Lattner | b0cbe71 | 2006-02-15 00:07:43 +0000 | [diff] [blame] | 1088 | // Emit the new branch that selects between the two versions of this loop. |
Weiming Zhao | f1abad5 | 2015-06-23 05:31:09 +0000 | [diff] [blame] | 1089 | EmitPreheaderBranchOnCondition(LIC, Val, NewBlocks[0], LoopBlocks[0], OldBR, |
| 1090 | TI); |
Devang Patel | d491198 | 2007-07-31 08:03:26 +0000 | [diff] [blame] | 1091 | LPM->deleteSimpleAnalysisValue(OldBR, L); |
Devang Patel | 83cc3f8 | 2007-09-20 23:45:50 +0000 | [diff] [blame] | 1092 | OldBR->eraseFromParent(); |
Devang Patel | a882328 | 2007-08-02 15:25:57 +0000 | [diff] [blame] | 1093 | |
Chris Lattner | c2e3a7a | 2006-02-18 07:57:38 +0000 | [diff] [blame] | 1094 | LoopProcessWorklist.push_back(NewLoop); |
Devang Patel | 7d165e1 | 2007-07-30 23:07:10 +0000 | [diff] [blame] | 1095 | redoLoop = true; |
Chris Lattner | f48f777 | 2004-04-19 18:07:02 +0000 | [diff] [blame] | 1096 | |
Chris Lattner | 5814d9d9 | 2010-04-20 05:09:16 +0000 | [diff] [blame] | 1097 | // Keep a WeakVH holding onto LIC. If the first call to RewriteLoopBody |
| 1098 | // deletes the instruction (for example by simplifying a PHI that feeds into |
| 1099 | // the condition that we're unswitching on), we don't rewrite the second |
| 1100 | // iteration. |
| 1101 | WeakVH LICHandle(LIC); |
Andrew Trick | 4104ed9 | 2012-04-10 05:14:37 +0000 | [diff] [blame] | 1102 | |
Chris Lattner | f48f777 | 2004-04-19 18:07:02 +0000 | [diff] [blame] | 1103 | // Now we rewrite the original code to know that the condition is true and the |
| 1104 | // new code to know that the condition is false. |
Evan Cheng | ba93044 | 2010-04-05 21:16:25 +0000 | [diff] [blame] | 1105 | RewriteLoopBodyWithConditionConstant(L, LIC, Val, false); |
Devang Patel | eb611dd | 2008-07-03 17:37:52 +0000 | [diff] [blame] | 1106 | |
Chris Lattner | 5814d9d9 | 2010-04-20 05:09:16 +0000 | [diff] [blame] | 1107 | // It's possible that simplifying one loop could cause the other to be |
| 1108 | // changed to another value or a constant. If its a constant, don't simplify |
| 1109 | // it. |
| 1110 | if (!LoopProcessWorklist.empty() && LoopProcessWorklist.back() == NewLoop && |
| 1111 | LICHandle && !isa<Constant>(LICHandle)) |
| 1112 | RewriteLoopBodyWithConditionConstant(NewLoop, LICHandle, Val, true); |
Chris Lattner | f48f777 | 2004-04-19 18:07:02 +0000 | [diff] [blame] | 1113 | } |
| 1114 | |
Sanjay Patel | 956e29c | 2015-08-11 21:24:04 +0000 | [diff] [blame] | 1115 | /// Remove all instances of I from the worklist vector specified. |
Andrew Trick | 4104ed9 | 2012-04-10 05:14:37 +0000 | [diff] [blame] | 1116 | static void RemoveFromWorklist(Instruction *I, |
Chris Lattner | 6fd1362 | 2006-02-17 00:31:07 +0000 | [diff] [blame] | 1117 | std::vector<Instruction*> &Worklist) { |
Jakub Staszak | 8f46e91 | 2012-10-16 19:52:32 +0000 | [diff] [blame] | 1118 | |
| 1119 | Worklist.erase(std::remove(Worklist.begin(), Worklist.end(), I), |
| 1120 | Worklist.end()); |
Chris Lattner | 6fd1362 | 2006-02-17 00:31:07 +0000 | [diff] [blame] | 1121 | } |
| 1122 | |
Sanjay Patel | 956e29c | 2015-08-11 21:24:04 +0000 | [diff] [blame] | 1123 | /// When we find that I really equals V, remove I from the |
Chris Lattner | 6fd1362 | 2006-02-17 00:31:07 +0000 | [diff] [blame] | 1124 | /// program, replacing all uses with V and update the worklist. |
Andrew Trick | 4104ed9 | 2012-04-10 05:14:37 +0000 | [diff] [blame] | 1125 | static void ReplaceUsesOfWith(Instruction *I, Value *V, |
Devang Patel | d491198 | 2007-07-31 08:03:26 +0000 | [diff] [blame] | 1126 | std::vector<Instruction*> &Worklist, |
| 1127 | Loop *L, LPPassManager *LPM) { |
David Greene | d9c355d | 2010-01-05 01:27:04 +0000 | [diff] [blame] | 1128 | DEBUG(dbgs() << "Replace with '" << *V << "': " << *I); |
Chris Lattner | 6fd1362 | 2006-02-17 00:31:07 +0000 | [diff] [blame] | 1129 | |
| 1130 | // Add uses to the worklist, which may be dead now. |
| 1131 | for (unsigned i = 0, e = I->getNumOperands(); i != e; ++i) |
| 1132 | if (Instruction *Use = dyn_cast<Instruction>(I->getOperand(i))) |
| 1133 | Worklist.push_back(Use); |
| 1134 | |
| 1135 | // Add users to the worklist which may be simplified now. |
Chandler Carruth | cdf4788 | 2014-03-09 03:16:01 +0000 | [diff] [blame] | 1136 | for (User *U : I->users()) |
| 1137 | Worklist.push_back(cast<Instruction>(U)); |
Devang Patel | d491198 | 2007-07-31 08:03:26 +0000 | [diff] [blame] | 1138 | LPM->deleteSimpleAnalysisValue(I, L); |
Chris Lattner | 6fd1362 | 2006-02-17 00:31:07 +0000 | [diff] [blame] | 1139 | RemoveFromWorklist(I, Worklist); |
Devang Patel | 83cc3f8 | 2007-09-20 23:45:50 +0000 | [diff] [blame] | 1140 | I->replaceAllUsesWith(V); |
| 1141 | I->eraseFromParent(); |
Chris Lattner | 6fd1362 | 2006-02-17 00:31:07 +0000 | [diff] [blame] | 1142 | ++NumSimplify; |
| 1143 | } |
| 1144 | |
Sanjay Patel | 956e29c | 2015-08-11 21:24:04 +0000 | [diff] [blame] | 1145 | /// We know either that the value LIC has the value specified by Val in the |
| 1146 | /// specified loop, or we know it does NOT have that value. |
| 1147 | /// Rewrite any uses of LIC or of properties correlated to it. |
Chris Lattner | f48f777 | 2004-04-19 18:07:02 +0000 | [diff] [blame] | 1148 | void LoopUnswitch::RewriteLoopBodyWithConditionConstant(Loop *L, Value *LIC, |
Chris Lattner | fbadd7e | 2006-02-11 00:43:37 +0000 | [diff] [blame] | 1149 | Constant *Val, |
| 1150 | bool IsEqual) { |
Chris Lattner | ed7a67b | 2006-02-10 01:24:09 +0000 | [diff] [blame] | 1151 | assert(!isa<Constant>(LIC) && "Why are we unswitching on a constant?"); |
Andrew Trick | 4104ed9 | 2012-04-10 05:14:37 +0000 | [diff] [blame] | 1152 | |
Chris Lattner | f48f777 | 2004-04-19 18:07:02 +0000 | [diff] [blame] | 1153 | // FIXME: Support correlated properties, like: |
| 1154 | // for (...) |
| 1155 | // if (li1 < li2) |
| 1156 | // ... |
| 1157 | // if (li1 > li2) |
| 1158 | // ... |
Andrew Trick | 4104ed9 | 2012-04-10 05:14:37 +0000 | [diff] [blame] | 1159 | |
Chris Lattner | 6e26315 | 2006-02-10 02:30:37 +0000 | [diff] [blame] | 1160 | // FOLD boolean conditions (X|LIC), (X&LIC). Fold conditional branches, |
| 1161 | // selects, switches. |
Chris Lattner | 6fd1362 | 2006-02-17 00:31:07 +0000 | [diff] [blame] | 1162 | std::vector<Instruction*> Worklist; |
Owen Anderson | 47db941 | 2009-07-22 00:24:57 +0000 | [diff] [blame] | 1163 | LLVMContext &Context = Val->getContext(); |
| 1164 | |
Chris Lattner | 6fd1362 | 2006-02-17 00:31:07 +0000 | [diff] [blame] | 1165 | // If we know that LIC == Val, or that LIC == NotVal, just replace uses of LIC |
| 1166 | // in the loop with the appropriate one directly. |
Owen Anderson | 55f1c09 | 2009-08-13 21:58:54 +0000 | [diff] [blame] | 1167 | if (IsEqual || (isa<ConstantInt>(Val) && |
Duncan Sands | 9dff9be | 2010-02-15 16:12:20 +0000 | [diff] [blame] | 1168 | Val->getType()->isIntegerTy(1))) { |
Chris Lattner | 8a5a324 | 2006-02-22 06:37:14 +0000 | [diff] [blame] | 1169 | Value *Replacement; |
| 1170 | if (IsEqual) |
| 1171 | Replacement = Val; |
| 1172 | else |
Andrew Trick | 4104ed9 | 2012-04-10 05:14:37 +0000 | [diff] [blame] | 1173 | Replacement = ConstantInt::get(Type::getInt1Ty(Val->getContext()), |
Reid Spencer | cddc9df | 2007-01-12 04:24:46 +0000 | [diff] [blame] | 1174 | !cast<ConstantInt>(Val)->getZExtValue()); |
Andrew Trick | 4104ed9 | 2012-04-10 05:14:37 +0000 | [diff] [blame] | 1175 | |
Chandler Carruth | cdf4788 | 2014-03-09 03:16:01 +0000 | [diff] [blame] | 1176 | for (User *U : LIC->users()) { |
| 1177 | Instruction *UI = dyn_cast<Instruction>(U); |
| 1178 | if (!UI || !L->contains(UI)) |
Evan Cheng | 1b55f56 | 2011-05-24 23:12:57 +0000 | [diff] [blame] | 1179 | continue; |
Chandler Carruth | cdf4788 | 2014-03-09 03:16:01 +0000 | [diff] [blame] | 1180 | Worklist.push_back(UI); |
Evan Cheng | 1b55f56 | 2011-05-24 23:12:57 +0000 | [diff] [blame] | 1181 | } |
Andrew Trick | 4104ed9 | 2012-04-10 05:14:37 +0000 | [diff] [blame] | 1182 | |
Jakub Staszak | 27da123 | 2013-08-06 17:03:42 +0000 | [diff] [blame] | 1183 | for (std::vector<Instruction*>::iterator UI = Worklist.begin(), |
| 1184 | UE = Worklist.end(); UI != UE; ++UI) |
Andrew Trick | 4104ed9 | 2012-04-10 05:14:37 +0000 | [diff] [blame] | 1185 | (*UI)->replaceUsesOfWith(LIC, Replacement); |
| 1186 | |
Chris Lattner | c832c1b | 2010-04-05 21:18:32 +0000 | [diff] [blame] | 1187 | SimplifyCode(Worklist, L); |
| 1188 | return; |
| 1189 | } |
Andrew Trick | 4104ed9 | 2012-04-10 05:14:37 +0000 | [diff] [blame] | 1190 | |
Chris Lattner | c832c1b | 2010-04-05 21:18:32 +0000 | [diff] [blame] | 1191 | // Otherwise, we don't know the precise value of LIC, but we do know that it |
| 1192 | // is certainly NOT "Val". As such, simplify any uses in the loop that we |
| 1193 | // can. This case occurs when we unswitch switch statements. |
Chandler Carruth | cdf4788 | 2014-03-09 03:16:01 +0000 | [diff] [blame] | 1194 | for (User *U : LIC->users()) { |
| 1195 | Instruction *UI = dyn_cast<Instruction>(U); |
| 1196 | if (!UI || !L->contains(UI)) |
Chris Lattner | c832c1b | 2010-04-05 21:18:32 +0000 | [diff] [blame] | 1197 | continue; |
Chris Lattner | 6fd1362 | 2006-02-17 00:31:07 +0000 | [diff] [blame] | 1198 | |
Chandler Carruth | cdf4788 | 2014-03-09 03:16:01 +0000 | [diff] [blame] | 1199 | Worklist.push_back(UI); |
Chris Lattner | 6fd1362 | 2006-02-17 00:31:07 +0000 | [diff] [blame] | 1200 | |
Andrew Trick | 4104ed9 | 2012-04-10 05:14:37 +0000 | [diff] [blame] | 1201 | // TODO: We could do other simplifications, for example, turning |
Chris Lattner | c832c1b | 2010-04-05 21:18:32 +0000 | [diff] [blame] | 1202 | // 'icmp eq LIC, Val' -> false. |
| 1203 | |
| 1204 | // If we know that LIC is not Val, use this info to simplify code. |
Chandler Carruth | cdf4788 | 2014-03-09 03:16:01 +0000 | [diff] [blame] | 1205 | SwitchInst *SI = dyn_cast<SwitchInst>(UI); |
Craig Topper | f40110f | 2014-04-25 05:29:35 +0000 | [diff] [blame] | 1206 | if (!SI || !isa<ConstantInt>(Val)) continue; |
Andrew Trick | 4104ed9 | 2012-04-10 05:14:37 +0000 | [diff] [blame] | 1207 | |
Stepan Dyatkovskiy | 5b648af | 2012-03-08 07:06:20 +0000 | [diff] [blame] | 1208 | SwitchInst::CaseIt DeadCase = SI->findCaseValue(cast<ConstantInt>(Val)); |
Stepan Dyatkovskiy | 513aaa5 | 2012-02-01 07:49:51 +0000 | [diff] [blame] | 1209 | // Default case is live for multiple values. |
Stepan Dyatkovskiy | 97b02fc | 2012-03-11 06:09:17 +0000 | [diff] [blame] | 1210 | if (DeadCase == SI->case_default()) continue; |
Andrew Trick | 4104ed9 | 2012-04-10 05:14:37 +0000 | [diff] [blame] | 1211 | |
| 1212 | // Found a dead case value. Don't remove PHI nodes in the |
Chris Lattner | c832c1b | 2010-04-05 21:18:32 +0000 | [diff] [blame] | 1213 | // successor if they become single-entry, those PHI nodes may |
| 1214 | // be in the Users list. |
Nick Lewycky | 6115824 | 2011-06-03 06:27:15 +0000 | [diff] [blame] | 1215 | |
Evan Cheng | 1b55f56 | 2011-05-24 23:12:57 +0000 | [diff] [blame] | 1216 | BasicBlock *Switch = SI->getParent(); |
Stepan Dyatkovskiy | 5b648af | 2012-03-08 07:06:20 +0000 | [diff] [blame] | 1217 | BasicBlock *SISucc = DeadCase.getCaseSuccessor(); |
Evan Cheng | 1b55f56 | 2011-05-24 23:12:57 +0000 | [diff] [blame] | 1218 | BasicBlock *Latch = L->getLoopLatch(); |
Andrew Trick | 4104ed9 | 2012-04-10 05:14:37 +0000 | [diff] [blame] | 1219 | |
Stepan Dyatkovskiy | cb2adbac | 2012-01-15 09:44:07 +0000 | [diff] [blame] | 1220 | BranchesInfo.setUnswitched(SI, Val); |
Andrew Trick | 4104ed9 | 2012-04-10 05:14:37 +0000 | [diff] [blame] | 1221 | |
Nick Lewycky | 6115824 | 2011-06-03 06:27:15 +0000 | [diff] [blame] | 1222 | if (!SI->findCaseDest(SISucc)) continue; // Edge is critical. |
Evan Cheng | 9605a69 | 2011-05-25 18:17:13 +0000 | [diff] [blame] | 1223 | // If the DeadCase successor dominates the loop latch, then the |
| 1224 | // transformation isn't safe since it will delete the sole predecessor edge |
| 1225 | // to the latch. |
| 1226 | if (Latch && DT->dominates(SISucc, Latch)) |
| 1227 | continue; |
Evan Cheng | 1b55f56 | 2011-05-24 23:12:57 +0000 | [diff] [blame] | 1228 | |
Chris Lattner | c832c1b | 2010-04-05 21:18:32 +0000 | [diff] [blame] | 1229 | // FIXME: This is a hack. We need to keep the successor around |
| 1230 | // and hooked up so as to preserve the loop structure, because |
| 1231 | // trying to update it is complicated. So instead we preserve the |
| 1232 | // loop structure and put the block on a dead code path. |
Chandler Carruth | d450056 | 2015-01-19 12:36:53 +0000 | [diff] [blame] | 1233 | SplitEdge(Switch, SISucc, DT, LI); |
Chris Lattner | c832c1b | 2010-04-05 21:18:32 +0000 | [diff] [blame] | 1234 | // Compute the successors instead of relying on the return value |
| 1235 | // of SplitEdge, since it may have split the switch successor |
| 1236 | // after PHI nodes. |
Stepan Dyatkovskiy | 5b648af | 2012-03-08 07:06:20 +0000 | [diff] [blame] | 1237 | BasicBlock *NewSISucc = DeadCase.getCaseSuccessor(); |
Chris Lattner | c832c1b | 2010-04-05 21:18:32 +0000 | [diff] [blame] | 1238 | BasicBlock *OldSISucc = *succ_begin(NewSISucc); |
| 1239 | // Create an "unreachable" destination. |
| 1240 | BasicBlock *Abort = BasicBlock::Create(Context, "us-unreachable", |
| 1241 | Switch->getParent(), |
| 1242 | OldSISucc); |
| 1243 | new UnreachableInst(Context, Abort); |
| 1244 | // Force the new case destination to branch to the "unreachable" |
| 1245 | // block while maintaining a (dead) CFG edge to the old block. |
| 1246 | NewSISucc->getTerminator()->eraseFromParent(); |
| 1247 | BranchInst::Create(Abort, OldSISucc, |
| 1248 | ConstantInt::getTrue(Context), NewSISucc); |
| 1249 | // Release the PHI operands for this edge. |
| 1250 | for (BasicBlock::iterator II = NewSISucc->begin(); |
| 1251 | PHINode *PN = dyn_cast<PHINode>(II); ++II) |
| 1252 | PN->setIncomingValue(PN->getBasicBlockIndex(Switch), |
| 1253 | UndefValue::get(PN->getType())); |
| 1254 | // Tell the domtree about the new block. We don't fully update the |
| 1255 | // domtree here -- instead we force it to do a full recomputation |
| 1256 | // after the pass is complete -- but we do need to inform it of |
| 1257 | // new blocks. |
Michael Zolotukhin | 9f3aea6 | 2015-09-22 00:22:47 +0000 | [diff] [blame] | 1258 | DT->addNewBlock(Abort, NewSISucc); |
Chris Lattner | 6fd1362 | 2006-02-17 00:31:07 +0000 | [diff] [blame] | 1259 | } |
Andrew Trick | 4104ed9 | 2012-04-10 05:14:37 +0000 | [diff] [blame] | 1260 | |
Devang Patel | d491198 | 2007-07-31 08:03:26 +0000 | [diff] [blame] | 1261 | SimplifyCode(Worklist, L); |
Chris Lattner | c2e3a7a | 2006-02-18 07:57:38 +0000 | [diff] [blame] | 1262 | } |
| 1263 | |
Sanjay Patel | 956e29c | 2015-08-11 21:24:04 +0000 | [diff] [blame] | 1264 | /// Now that we have simplified some instructions in the loop, walk over it and |
| 1265 | /// constant prop, dce, and fold control flow where possible. Note that this is |
| 1266 | /// effectively a very simple loop-structure-aware optimizer. During processing |
| 1267 | /// of this loop, L could very well be deleted, so it must not be used. |
Chris Lattner | c2e3a7a | 2006-02-18 07:57:38 +0000 | [diff] [blame] | 1268 | /// |
| 1269 | /// FIXME: When the loop optimizer is more mature, separate this out to a new |
| 1270 | /// pass. |
| 1271 | /// |
Devang Patel | d491198 | 2007-07-31 08:03:26 +0000 | [diff] [blame] | 1272 | void LoopUnswitch::SimplifyCode(std::vector<Instruction*> &Worklist, Loop *L) { |
Mehdi Amini | a28d91d | 2015-03-10 02:37:25 +0000 | [diff] [blame] | 1273 | const DataLayout &DL = L->getHeader()->getModule()->getDataLayout(); |
Chris Lattner | 6fd1362 | 2006-02-17 00:31:07 +0000 | [diff] [blame] | 1274 | while (!Worklist.empty()) { |
| 1275 | Instruction *I = Worklist.back(); |
| 1276 | Worklist.pop_back(); |
Duncan Sands | bb2cd02 | 2010-11-23 20:24:21 +0000 | [diff] [blame] | 1277 | |
Chris Lattner | 6fd1362 | 2006-02-17 00:31:07 +0000 | [diff] [blame] | 1278 | // Simple DCE. |
| 1279 | if (isInstructionTriviallyDead(I)) { |
David Greene | d9c355d | 2010-01-05 01:27:04 +0000 | [diff] [blame] | 1280 | DEBUG(dbgs() << "Remove dead instruction '" << *I); |
Andrew Trick | 4104ed9 | 2012-04-10 05:14:37 +0000 | [diff] [blame] | 1281 | |
Chris Lattner | 6fd1362 | 2006-02-17 00:31:07 +0000 | [diff] [blame] | 1282 | // Add uses to the worklist, which may be dead now. |
| 1283 | for (unsigned i = 0, e = I->getNumOperands(); i != e; ++i) |
| 1284 | if (Instruction *Use = dyn_cast<Instruction>(I->getOperand(i))) |
| 1285 | Worklist.push_back(Use); |
Devang Patel | d491198 | 2007-07-31 08:03:26 +0000 | [diff] [blame] | 1286 | LPM->deleteSimpleAnalysisValue(I, L); |
Chris Lattner | 6fd1362 | 2006-02-17 00:31:07 +0000 | [diff] [blame] | 1287 | RemoveFromWorklist(I, Worklist); |
Devang Patel | 83cc3f8 | 2007-09-20 23:45:50 +0000 | [diff] [blame] | 1288 | I->eraseFromParent(); |
Chris Lattner | 6fd1362 | 2006-02-17 00:31:07 +0000 | [diff] [blame] | 1289 | ++NumSimplify; |
| 1290 | continue; |
| 1291 | } |
Duncan Sands | aef146b | 2010-11-18 19:59:41 +0000 | [diff] [blame] | 1292 | |
Chris Lattner | 66e809a | 2010-04-20 05:33:18 +0000 | [diff] [blame] | 1293 | // See if instruction simplification can hack this up. This is common for |
| 1294 | // things like "select false, X, Y" after unswitching made the condition be |
Peter Collingbourne | 9a03c73 | 2012-05-20 01:32:09 +0000 | [diff] [blame] | 1295 | // 'false'. TODO: update the domtree properly so we can pass it here. |
Mehdi Amini | a28d91d | 2015-03-10 02:37:25 +0000 | [diff] [blame] | 1296 | if (Value *V = SimplifyInstruction(I, DL)) |
Duncan Sands | aef146b | 2010-11-18 19:59:41 +0000 | [diff] [blame] | 1297 | if (LI->replacementPreservesLCSSAForm(I, V)) { |
| 1298 | ReplaceUsesOfWith(I, V, Worklist, L, LPM); |
| 1299 | continue; |
| 1300 | } |
| 1301 | |
Chris Lattner | 6fd1362 | 2006-02-17 00:31:07 +0000 | [diff] [blame] | 1302 | // Special case hacks that appear commonly in unswitched code. |
Chris Lattner | 66e809a | 2010-04-20 05:33:18 +0000 | [diff] [blame] | 1303 | if (BranchInst *BI = dyn_cast<BranchInst>(I)) { |
Chris Lattner | 6fd1362 | 2006-02-17 00:31:07 +0000 | [diff] [blame] | 1304 | if (BI->isUnconditional()) { |
| 1305 | // If BI's parent is the only pred of the successor, fold the two blocks |
| 1306 | // together. |
| 1307 | BasicBlock *Pred = BI->getParent(); |
| 1308 | BasicBlock *Succ = BI->getSuccessor(0); |
| 1309 | BasicBlock *SinglePred = Succ->getSinglePredecessor(); |
| 1310 | if (!SinglePred) continue; // Nothing to do. |
| 1311 | assert(SinglePred == Pred && "CFG broken"); |
| 1312 | |
Andrew Trick | 4104ed9 | 2012-04-10 05:14:37 +0000 | [diff] [blame] | 1313 | DEBUG(dbgs() << "Merging blocks: " << Pred->getName() << " <- " |
Daniel Dunbar | 0dd5e1e | 2009-07-25 00:23:56 +0000 | [diff] [blame] | 1314 | << Succ->getName() << "\n"); |
Andrew Trick | 4104ed9 | 2012-04-10 05:14:37 +0000 | [diff] [blame] | 1315 | |
Chris Lattner | 6fd1362 | 2006-02-17 00:31:07 +0000 | [diff] [blame] | 1316 | // Resolve any single entry PHI nodes in Succ. |
| 1317 | while (PHINode *PN = dyn_cast<PHINode>(Succ->begin())) |
Devang Patel | d491198 | 2007-07-31 08:03:26 +0000 | [diff] [blame] | 1318 | ReplaceUsesOfWith(PN, PN->getIncomingValue(0), Worklist, L, LPM); |
Andrew Trick | 4104ed9 | 2012-04-10 05:14:37 +0000 | [diff] [blame] | 1319 | |
Jay Foad | 61ea0e4 | 2011-06-23 09:09:15 +0000 | [diff] [blame] | 1320 | // If Succ has any successors with PHI nodes, update them to have |
| 1321 | // entries coming from Pred instead of Succ. |
| 1322 | Succ->replaceAllUsesWith(Pred); |
Andrew Trick | 4104ed9 | 2012-04-10 05:14:37 +0000 | [diff] [blame] | 1323 | |
Chris Lattner | 6fd1362 | 2006-02-17 00:31:07 +0000 | [diff] [blame] | 1324 | // Move all of the successor contents from Succ to Pred. |
| 1325 | Pred->getInstList().splice(BI, Succ->getInstList(), Succ->begin(), |
| 1326 | Succ->end()); |
Devang Patel | d491198 | 2007-07-31 08:03:26 +0000 | [diff] [blame] | 1327 | LPM->deleteSimpleAnalysisValue(BI, L); |
Devang Patel | 83cc3f8 | 2007-09-20 23:45:50 +0000 | [diff] [blame] | 1328 | BI->eraseFromParent(); |
Chris Lattner | 6fd1362 | 2006-02-17 00:31:07 +0000 | [diff] [blame] | 1329 | RemoveFromWorklist(BI, Worklist); |
Andrew Trick | 4104ed9 | 2012-04-10 05:14:37 +0000 | [diff] [blame] | 1330 | |
Chris Lattner | 6fd1362 | 2006-02-17 00:31:07 +0000 | [diff] [blame] | 1331 | // Remove Succ from the loop tree. |
| 1332 | LI->removeBlock(Succ); |
Devang Patel | d491198 | 2007-07-31 08:03:26 +0000 | [diff] [blame] | 1333 | LPM->deleteSimpleAnalysisValue(Succ, L); |
Devang Patel | 83cc3f8 | 2007-09-20 23:45:50 +0000 | [diff] [blame] | 1334 | Succ->eraseFromParent(); |
Chris Lattner | 29f771b | 2006-02-18 01:27:45 +0000 | [diff] [blame] | 1335 | ++NumSimplify; |
Chris Lattner | 66e809a | 2010-04-20 05:33:18 +0000 | [diff] [blame] | 1336 | continue; |
Chris Lattner | c832c1b | 2010-04-05 21:18:32 +0000 | [diff] [blame] | 1337 | } |
Andrew Trick | 4104ed9 | 2012-04-10 05:14:37 +0000 | [diff] [blame] | 1338 | |
Chris Lattner | 66e809a | 2010-04-20 05:33:18 +0000 | [diff] [blame] | 1339 | continue; |
Chris Lattner | 6fd1362 | 2006-02-17 00:31:07 +0000 | [diff] [blame] | 1340 | } |
| 1341 | } |
Chris Lattner | f48f777 | 2004-04-19 18:07:02 +0000 | [diff] [blame] | 1342 | } |