Chris Lattner | 67a9801 | 2003-10-12 21:44:18 +0000 | [diff] [blame] | 1 | //===- LoopSimplify.cpp - Loop Canonicalization Pass ----------------------===// |
Misha Brukman | fd93908 | 2005-04-21 23:48:37 +0000 | [diff] [blame] | 2 | // |
John Criswell | b576c94 | 2003-10-20 19:43:21 +0000 | [diff] [blame] | 3 | // The LLVM Compiler Infrastructure |
| 4 | // |
Chris Lattner | 4ee451d | 2007-12-29 20:36:04 +0000 | [diff] [blame] | 5 | // This file is distributed under the University of Illinois Open Source |
| 6 | // License. See LICENSE.TXT for details. |
Misha Brukman | fd93908 | 2005-04-21 23:48:37 +0000 | [diff] [blame] | 7 | // |
John Criswell | b576c94 | 2003-10-20 19:43:21 +0000 | [diff] [blame] | 8 | //===----------------------------------------------------------------------===// |
Chris Lattner | 38acf9e | 2002-09-26 16:17:31 +0000 | [diff] [blame] | 9 | // |
Chris Lattner | ee2c50c | 2003-10-12 21:43:28 +0000 | [diff] [blame] | 10 | // This pass performs several transformations to transform natural loops into a |
| 11 | // simpler form, which makes subsequent analyses and transformations simpler and |
| 12 | // more effective. |
Chris Lattner | dbf3cd7 | 2003-02-27 20:27:08 +0000 | [diff] [blame] | 13 | // |
| 14 | // Loop pre-header insertion guarantees that there is a single, non-critical |
| 15 | // entry edge from outside of the loop to the loop header. This simplifies a |
| 16 | // number of analyses and transformations, such as LICM. |
| 17 | // |
| 18 | // Loop exit-block insertion guarantees that all exit blocks from the loop |
| 19 | // (blocks which are outside of the loop that have predecessors inside of the |
Chris Lattner | 66ea98e | 2003-12-10 17:20:35 +0000 | [diff] [blame] | 20 | // loop) only have predecessors from inside of the loop (and are thus dominated |
| 21 | // by the loop header). This simplifies transformations such as store-sinking |
| 22 | // that are built into LICM. |
Chris Lattner | dbf3cd7 | 2003-02-27 20:27:08 +0000 | [diff] [blame] | 23 | // |
Chris Lattner | 2ab6a73 | 2003-10-13 00:37:13 +0000 | [diff] [blame] | 24 | // This pass also guarantees that loops will have exactly one backedge. |
| 25 | // |
Dan Gohman | f4e82d1 | 2009-11-05 21:14:46 +0000 | [diff] [blame] | 26 | // Indirectbr instructions introduce several complications. If the loop |
| 27 | // contains or is entered by an indirectbr instruction, it may not be possible |
| 28 | // to transform the loop and make these guarantees. Client code should check |
| 29 | // that these conditions are true before relying on them. |
| 30 | // |
Chris Lattner | dbf3cd7 | 2003-02-27 20:27:08 +0000 | [diff] [blame] | 31 | // Note that the simplifycfg pass will clean up blocks which are split out but |
Chris Lattner | ee2c50c | 2003-10-12 21:43:28 +0000 | [diff] [blame] | 32 | // end up being unnecessary, so usage of this pass should not pessimize |
| 33 | // generated code. |
| 34 | // |
| 35 | // This pass obviously modifies the CFG, but updates loop information and |
| 36 | // dominator information. |
Chris Lattner | 38acf9e | 2002-09-26 16:17:31 +0000 | [diff] [blame] | 37 | // |
| 38 | //===----------------------------------------------------------------------===// |
| 39 | |
Cameron Zwarich | 4a60b93 | 2011-02-10 23:38:10 +0000 | [diff] [blame] | 40 | #define DEBUG_TYPE "loop-simplify" |
Chris Lattner | 38acf9e | 2002-09-26 16:17:31 +0000 | [diff] [blame] | 41 | #include "llvm/Transforms/Scalar.h" |
Chandler Carruth | d04a8d4 | 2012-12-03 16:50:05 +0000 | [diff] [blame] | 42 | #include "llvm/ADT/DepthFirstIterator.h" |
| 43 | #include "llvm/ADT/SetOperations.h" |
| 44 | #include "llvm/ADT/SetVector.h" |
Stephen Hines | 36b5688 | 2014-04-23 16:57:46 -0700 | [diff] [blame] | 45 | #include "llvm/ADT/SmallVector.h" |
Chandler Carruth | d04a8d4 | 2012-12-03 16:50:05 +0000 | [diff] [blame] | 46 | #include "llvm/ADT/Statistic.h" |
Chris Lattner | cec5b88 | 2005-03-25 06:37:22 +0000 | [diff] [blame] | 47 | #include "llvm/Analysis/AliasAnalysis.h" |
Benjamin Kramer | 8999f47 | 2012-10-26 17:40:50 +0000 | [diff] [blame] | 48 | #include "llvm/Analysis/DependenceAnalysis.h" |
Duncan Sands | cdbd992 | 2010-11-16 17:41:24 +0000 | [diff] [blame] | 49 | #include "llvm/Analysis/InstructionSimplify.h" |
Stephen Hines | 36b5688 | 2014-04-23 16:57:46 -0700 | [diff] [blame] | 50 | #include "llvm/Analysis/LoopInfo.h" |
Duncan Sands | cdbd992 | 2010-11-16 17:41:24 +0000 | [diff] [blame] | 51 | #include "llvm/Analysis/ScalarEvolution.h" |
Stephen Hines | 36b5688 | 2014-04-23 16:57:46 -0700 | [diff] [blame] | 52 | #include "llvm/IR/CFG.h" |
Chandler Carruth | 0b8c9a8 | 2013-01-02 11:36:10 +0000 | [diff] [blame] | 53 | #include "llvm/IR/Constants.h" |
Stephen Hines | 36b5688 | 2014-04-23 16:57:46 -0700 | [diff] [blame] | 54 | #include "llvm/IR/Dominators.h" |
Chandler Carruth | 0b8c9a8 | 2013-01-02 11:36:10 +0000 | [diff] [blame] | 55 | #include "llvm/IR/Function.h" |
| 56 | #include "llvm/IR/Instructions.h" |
| 57 | #include "llvm/IR/IntrinsicInst.h" |
| 58 | #include "llvm/IR/LLVMContext.h" |
| 59 | #include "llvm/IR/Type.h" |
Dan Gohman | c5e49c6 | 2010-03-01 17:55:27 +0000 | [diff] [blame] | 60 | #include "llvm/Support/Debug.h" |
Chandler Carruth | d04a8d4 | 2012-12-03 16:50:05 +0000 | [diff] [blame] | 61 | #include "llvm/Transforms/Utils/BasicBlockUtils.h" |
| 62 | #include "llvm/Transforms/Utils/Local.h" |
Hal Finkel | 4e6b24f | 2013-05-20 20:46:30 +0000 | [diff] [blame] | 63 | #include "llvm/Transforms/Utils/LoopUtils.h" |
Chris Lattner | 66ea98e | 2003-12-10 17:20:35 +0000 | [diff] [blame] | 64 | using namespace llvm; |
Brian Gaeke | d0fde30 | 2003-11-11 22:41:34 +0000 | [diff] [blame] | 65 | |
Chris Lattner | d216e8b | 2006-12-19 22:17:40 +0000 | [diff] [blame] | 66 | STATISTIC(NumInserted, "Number of pre-header or exit blocks inserted"); |
| 67 | STATISTIC(NumNested , "Number of nested loops split out"); |
Chris Lattner | 38acf9e | 2002-09-26 16:17:31 +0000 | [diff] [blame] | 68 | |
Stephen Hines | 36b5688 | 2014-04-23 16:57:46 -0700 | [diff] [blame] | 69 | // If the block isn't already, move the new block to right after some 'outside |
| 70 | // block' block. This prevents the preheader from being placed inside the loop |
| 71 | // body, e.g. when the loop hasn't been rotated. |
| 72 | static void placeSplitBlockCarefully(BasicBlock *NewBB, |
| 73 | SmallVectorImpl<BasicBlock *> &SplitPreds, |
| 74 | Loop *L) { |
| 75 | // Check to see if NewBB is already well placed. |
| 76 | Function::iterator BBI = NewBB; --BBI; |
| 77 | for (unsigned i = 0, e = SplitPreds.size(); i != e; ++i) { |
| 78 | if (&*BBI == SplitPreds[i]) |
| 79 | return; |
| 80 | } |
Devang Patel | 794fd75 | 2007-05-01 21:15:47 +0000 | [diff] [blame] | 81 | |
Stephen Hines | 36b5688 | 2014-04-23 16:57:46 -0700 | [diff] [blame] | 82 | // If it isn't already after an outside block, move it after one. This is |
| 83 | // always good as it makes the uncond branch from the outside block into a |
| 84 | // fall-through. |
Misha Brukman | fd93908 | 2005-04-21 23:48:37 +0000 | [diff] [blame] | 85 | |
Stephen Hines | 36b5688 | 2014-04-23 16:57:46 -0700 | [diff] [blame] | 86 | // Figure out *which* outside block to put this after. Prefer an outside |
| 87 | // block that neighbors a BB actually in the loop. |
| 88 | BasicBlock *FoundBB = 0; |
| 89 | for (unsigned i = 0, e = SplitPreds.size(); i != e; ++i) { |
| 90 | Function::iterator BBI = SplitPreds[i]; |
| 91 | if (++BBI != NewBB->getParent()->end() && |
| 92 | L->contains(BBI)) { |
| 93 | FoundBB = SplitPreds[i]; |
| 94 | break; |
Dan Gohman | d84db11 | 2009-09-28 14:37:51 +0000 | [diff] [blame] | 95 | } |
| 96 | } |
Chris Lattner | 2ef703e | 2004-03-14 03:59:22 +0000 | [diff] [blame] | 97 | |
Stephen Hines | 36b5688 | 2014-04-23 16:57:46 -0700 | [diff] [blame] | 98 | // If our heuristic for a *good* bb to place this after doesn't find |
| 99 | // anything, just pick something. It's likely better than leaving it within |
| 100 | // the loop. |
| 101 | if (!FoundBB) |
| 102 | FoundBB = SplitPreds[0]; |
| 103 | NewBB->moveAfter(FoundBB); |
Chris Lattner | 38acf9e | 2002-09-26 16:17:31 +0000 | [diff] [blame] | 104 | } |
| 105 | |
Chris Lattner | 38acf9e | 2002-09-26 16:17:31 +0000 | [diff] [blame] | 106 | /// InsertPreheaderForLoop - Once we discover that a loop doesn't have a |
| 107 | /// preheader, this method is called to insert one. This method has two phases: |
| 108 | /// preheader insertion and analysis updating. |
| 109 | /// |
Hal Finkel | fc32605 | 2013-05-20 16:47:07 +0000 | [diff] [blame] | 110 | BasicBlock *llvm::InsertPreheaderForLoop(Loop *L, Pass *PP) { |
Chris Lattner | 38acf9e | 2002-09-26 16:17:31 +0000 | [diff] [blame] | 111 | BasicBlock *Header = L->getHeader(); |
| 112 | |
| 113 | // Compute the set of predecessors of the loop that are not in the loop. |
Chris Lattner | 54b9c3b | 2008-04-21 01:28:02 +0000 | [diff] [blame] | 114 | SmallVector<BasicBlock*, 8> OutsideBlocks; |
Chris Lattner | 38acf9e | 2002-09-26 16:17:31 +0000 | [diff] [blame] | 115 | for (pred_iterator PI = pred_begin(Header), PE = pred_end(Header); |
Gabor Greif | 9672414 | 2010-07-09 14:02:13 +0000 | [diff] [blame] | 116 | PI != PE; ++PI) { |
| 117 | BasicBlock *P = *PI; |
| 118 | if (!L->contains(P)) { // Coming in from outside the loop? |
Dan Gohman | f4e82d1 | 2009-11-05 21:14:46 +0000 | [diff] [blame] | 119 | // If the loop is branched to from an indirect branch, we won't |
| 120 | // be able to fully transform the loop, because it prohibits |
| 121 | // edge splitting. |
Gabor Greif | 9672414 | 2010-07-09 14:02:13 +0000 | [diff] [blame] | 122 | if (isa<IndirectBrInst>(P->getTerminator())) return 0; |
Dan Gohman | f4e82d1 | 2009-11-05 21:14:46 +0000 | [diff] [blame] | 123 | |
| 124 | // Keep track of it. |
Gabor Greif | 9672414 | 2010-07-09 14:02:13 +0000 | [diff] [blame] | 125 | OutsideBlocks.push_back(P); |
Dan Gohman | f4e82d1 | 2009-11-05 21:14:46 +0000 | [diff] [blame] | 126 | } |
Gabor Greif | 9672414 | 2010-07-09 14:02:13 +0000 | [diff] [blame] | 127 | } |
Misha Brukman | fd93908 | 2005-04-21 23:48:37 +0000 | [diff] [blame] | 128 | |
Chris Lattner | c398457 | 2006-09-23 07:40:52 +0000 | [diff] [blame] | 129 | // Split out the loop pre-header. |
Eli Friedman | 7d1ff37 | 2011-12-15 00:50:34 +0000 | [diff] [blame] | 130 | BasicBlock *PreheaderBB; |
| 131 | if (!Header->isLandingPad()) { |
| 132 | PreheaderBB = SplitBlockPredecessors(Header, OutsideBlocks, ".preheader", |
Hal Finkel | fc32605 | 2013-05-20 16:47:07 +0000 | [diff] [blame] | 133 | PP); |
Eli Friedman | 7d1ff37 | 2011-12-15 00:50:34 +0000 | [diff] [blame] | 134 | } else { |
| 135 | SmallVector<BasicBlock*, 2> NewBBs; |
Andrew Trick | cd1142e | 2012-03-20 21:24:47 +0000 | [diff] [blame] | 136 | SplitLandingPadPredecessors(Header, OutsideBlocks, ".preheader", |
Hal Finkel | fc32605 | 2013-05-20 16:47:07 +0000 | [diff] [blame] | 137 | ".split-lp", PP, NewBBs); |
Eli Friedman | 7d1ff37 | 2011-12-15 00:50:34 +0000 | [diff] [blame] | 138 | PreheaderBB = NewBBs[0]; |
| 139 | } |
Chris Lattner | 9f879cf | 2003-02-27 22:48:57 +0000 | [diff] [blame] | 140 | |
Eli Friedman | 7d1ff37 | 2011-12-15 00:50:34 +0000 | [diff] [blame] | 141 | PreheaderBB->getTerminator()->setDebugLoc( |
| 142 | Header->getFirstNonPHI()->getDebugLoc()); |
| 143 | DEBUG(dbgs() << "LoopSimplify: Creating pre-header " |
| 144 | << PreheaderBB->getName() << "\n"); |
Dan Gohman | c5e49c6 | 2010-03-01 17:55:27 +0000 | [diff] [blame] | 145 | |
Chris Lattner | 120fce5 | 2006-09-23 08:19:21 +0000 | [diff] [blame] | 146 | // Make sure that NewBB is put someplace intelligent, which doesn't mess up |
| 147 | // code layout too horribly. |
Stephen Hines | 36b5688 | 2014-04-23 16:57:46 -0700 | [diff] [blame] | 148 | placeSplitBlockCarefully(PreheaderBB, OutsideBlocks, L); |
Dan Gohman | 0df6e09 | 2009-07-14 01:37:59 +0000 | [diff] [blame] | 149 | |
Eli Friedman | 7d1ff37 | 2011-12-15 00:50:34 +0000 | [diff] [blame] | 150 | return PreheaderBB; |
Chris Lattner | dbf3cd7 | 2003-02-27 20:27:08 +0000 | [diff] [blame] | 151 | } |
| 152 | |
Stephen Hines | 36b5688 | 2014-04-23 16:57:46 -0700 | [diff] [blame] | 153 | /// \brief Ensure that the loop preheader dominates all exit blocks. |
| 154 | /// |
| 155 | /// This method is used to split exit blocks that have predecessors outside of |
| 156 | /// the loop. |
| 157 | static BasicBlock *rewriteLoopExitBlock(Loop *L, BasicBlock *Exit, Pass *PP) { |
Chris Lattner | 54b9c3b | 2008-04-21 01:28:02 +0000 | [diff] [blame] | 158 | SmallVector<BasicBlock*, 8> LoopBlocks; |
Gabor Greif | 9672414 | 2010-07-09 14:02:13 +0000 | [diff] [blame] | 159 | for (pred_iterator I = pred_begin(Exit), E = pred_end(Exit); I != E; ++I) { |
| 160 | BasicBlock *P = *I; |
| 161 | if (L->contains(P)) { |
Dan Gohman | f4e82d1 | 2009-11-05 21:14:46 +0000 | [diff] [blame] | 162 | // Don't do this if the loop is exited via an indirect branch. |
Gabor Greif | 9672414 | 2010-07-09 14:02:13 +0000 | [diff] [blame] | 163 | if (isa<IndirectBrInst>(P->getTerminator())) return 0; |
Dan Gohman | f4e82d1 | 2009-11-05 21:14:46 +0000 | [diff] [blame] | 164 | |
Gabor Greif | 9672414 | 2010-07-09 14:02:13 +0000 | [diff] [blame] | 165 | LoopBlocks.push_back(P); |
Dan Gohman | f4e82d1 | 2009-11-05 21:14:46 +0000 | [diff] [blame] | 166 | } |
Gabor Greif | 9672414 | 2010-07-09 14:02:13 +0000 | [diff] [blame] | 167 | } |
Chris Lattner | dbf3cd7 | 2003-02-27 20:27:08 +0000 | [diff] [blame] | 168 | |
Chris Lattner | 7e7ad49 | 2003-02-27 22:31:07 +0000 | [diff] [blame] | 169 | assert(!LoopBlocks.empty() && "No edges coming in from outside the loop?"); |
Bill Wendling | b29ec06 | 2011-08-19 00:09:22 +0000 | [diff] [blame] | 170 | BasicBlock *NewExitBB = 0; |
| 171 | |
| 172 | if (Exit->isLandingPad()) { |
| 173 | SmallVector<BasicBlock*, 2> NewBBs; |
| 174 | SplitLandingPadPredecessors(Exit, ArrayRef<BasicBlock*>(&LoopBlocks[0], |
| 175 | LoopBlocks.size()), |
| 176 | ".loopexit", ".nonloopexit", |
Stephen Hines | 36b5688 | 2014-04-23 16:57:46 -0700 | [diff] [blame] | 177 | PP, NewBBs); |
Bill Wendling | b29ec06 | 2011-08-19 00:09:22 +0000 | [diff] [blame] | 178 | NewExitBB = NewBBs[0]; |
| 179 | } else { |
Stephen Hines | 36b5688 | 2014-04-23 16:57:46 -0700 | [diff] [blame] | 180 | NewExitBB = SplitBlockPredecessors(Exit, LoopBlocks, ".loopexit", PP); |
Bill Wendling | b29ec06 | 2011-08-19 00:09:22 +0000 | [diff] [blame] | 181 | } |
Chris Lattner | 7e7ad49 | 2003-02-27 22:31:07 +0000 | [diff] [blame] | 182 | |
Chris Lattner | 9fc5cdf | 2011-01-02 22:09:33 +0000 | [diff] [blame] | 183 | DEBUG(dbgs() << "LoopSimplify: Creating dedicated exit block " |
Bill Wendling | b29ec06 | 2011-08-19 00:09:22 +0000 | [diff] [blame] | 184 | << NewExitBB->getName() << "\n"); |
| 185 | return NewExitBB; |
Chris Lattner | 2ab6a73 | 2003-10-13 00:37:13 +0000 | [diff] [blame] | 186 | } |
| 187 | |
Stephen Hines | 36b5688 | 2014-04-23 16:57:46 -0700 | [diff] [blame] | 188 | /// Add the specified block, and all of its predecessors, to the specified set, |
| 189 | /// if it's not already in there. Stop predecessor traversal when we reach |
| 190 | /// StopBlock. |
| 191 | static void addBlockAndPredsToSet(BasicBlock *InputBB, BasicBlock *StopBlock, |
Chris Lattner | 529b28d | 2004-04-13 05:05:33 +0000 | [diff] [blame] | 192 | std::set<BasicBlock*> &Blocks) { |
Stephen Hines | 36b5688 | 2014-04-23 16:57:46 -0700 | [diff] [blame] | 193 | SmallVector<BasicBlock *, 8> Worklist; |
| 194 | Worklist.push_back(InputBB); |
Devang Patel | 58d7fbf | 2007-04-20 20:04:37 +0000 | [diff] [blame] | 195 | do { |
Stephen Hines | 36b5688 | 2014-04-23 16:57:46 -0700 | [diff] [blame] | 196 | BasicBlock *BB = Worklist.pop_back_val(); |
Devang Patel | 58d7fbf | 2007-04-20 20:04:37 +0000 | [diff] [blame] | 197 | if (Blocks.insert(BB).second && BB != StopBlock) |
| 198 | // If BB is not already processed and it is not a stop block then |
| 199 | // insert its predecessor in the work list |
| 200 | for (pred_iterator I = pred_begin(BB), E = pred_end(BB); I != E; ++I) { |
| 201 | BasicBlock *WBB = *I; |
Stephen Hines | 36b5688 | 2014-04-23 16:57:46 -0700 | [diff] [blame] | 202 | Worklist.push_back(WBB); |
Devang Patel | 58d7fbf | 2007-04-20 20:04:37 +0000 | [diff] [blame] | 203 | } |
Stephen Hines | 36b5688 | 2014-04-23 16:57:46 -0700 | [diff] [blame] | 204 | } while (!Worklist.empty()); |
Chris Lattner | 529b28d | 2004-04-13 05:05:33 +0000 | [diff] [blame] | 205 | } |
| 206 | |
Stephen Hines | 36b5688 | 2014-04-23 16:57:46 -0700 | [diff] [blame] | 207 | /// \brief The first part of loop-nestification is to find a PHI node that tells |
| 208 | /// us how to partition the loops. |
| 209 | static PHINode *findPHIToPartitionLoops(Loop *L, AliasAnalysis *AA, |
| 210 | DominatorTree *DT) { |
Alkis Evlogimenos | 200a360 | 2004-09-28 02:40:37 +0000 | [diff] [blame] | 211 | for (BasicBlock::iterator I = L->getHeader()->begin(); isa<PHINode>(I); ) { |
| 212 | PHINode *PN = cast<PHINode>(I); |
Chris Lattner | 1f62f82 | 2004-04-13 15:21:18 +0000 | [diff] [blame] | 213 | ++I; |
Chad Rosier | 618c1db | 2011-12-01 03:08:23 +0000 | [diff] [blame] | 214 | if (Value *V = SimplifyInstruction(PN, 0, 0, DT)) { |
Duncan Sands | 67fb341 | 2011-01-02 13:38:21 +0000 | [diff] [blame] | 215 | // This is a degenerate PHI already, don't modify it! |
| 216 | PN->replaceAllUsesWith(V); |
| 217 | if (AA) AA->deleteValue(PN); |
| 218 | PN->eraseFromParent(); |
| 219 | continue; |
| 220 | } |
Chris Lattner | c30bda7 | 2004-10-17 21:22:38 +0000 | [diff] [blame] | 221 | |
| 222 | // Scan this PHI node looking for a use of the PHI node by itself. |
| 223 | for (unsigned i = 0, e = PN->getNumIncomingValues(); i != e; ++i) |
| 224 | if (PN->getIncomingValue(i) == PN && |
| 225 | L->contains(PN->getIncomingBlock(i))) |
| 226 | // We found something tasty to remove. |
| 227 | return PN; |
Chris Lattner | 1f62f82 | 2004-04-13 15:21:18 +0000 | [diff] [blame] | 228 | } |
| 229 | return 0; |
| 230 | } |
| 231 | |
Stephen Hines | 36b5688 | 2014-04-23 16:57:46 -0700 | [diff] [blame] | 232 | /// \brief If this loop has multiple backedges, try to pull one of them out into |
| 233 | /// a nested loop. |
| 234 | /// |
| 235 | /// This is important for code that looks like |
Chris Lattner | 529b28d | 2004-04-13 05:05:33 +0000 | [diff] [blame] | 236 | /// this: |
| 237 | /// |
| 238 | /// Loop: |
| 239 | /// ... |
| 240 | /// br cond, Loop, Next |
| 241 | /// ... |
| 242 | /// br cond2, Loop, Out |
| 243 | /// |
| 244 | /// To identify this common case, we look at the PHI nodes in the header of the |
| 245 | /// loop. PHI nodes with unchanging values on one backedge correspond to values |
| 246 | /// that change in the "outer" loop, but not in the "inner" loop. |
| 247 | /// |
| 248 | /// If we are able to separate out a loop, return the new outer loop that was |
| 249 | /// created. |
| 250 | /// |
Stephen Hines | 36b5688 | 2014-04-23 16:57:46 -0700 | [diff] [blame] | 251 | static Loop *separateNestedLoop(Loop *L, BasicBlock *Preheader, |
| 252 | AliasAnalysis *AA, DominatorTree *DT, |
| 253 | LoopInfo *LI, ScalarEvolution *SE, Pass *PP) { |
Andrew Trick | 7edc277 | 2012-03-20 21:24:52 +0000 | [diff] [blame] | 254 | // Don't try to separate loops without a preheader. |
Eli Friedman | 7d1ff37 | 2011-12-15 00:50:34 +0000 | [diff] [blame] | 255 | if (!Preheader) |
| 256 | return 0; |
| 257 | |
| 258 | // The header is not a landing pad; preheader insertion should ensure this. |
| 259 | assert(!L->getHeader()->isLandingPad() && |
| 260 | "Can't insert backedge to landing pad"); |
| 261 | |
Stephen Hines | 36b5688 | 2014-04-23 16:57:46 -0700 | [diff] [blame] | 262 | PHINode *PN = findPHIToPartitionLoops(L, AA, DT); |
Chris Lattner | 1f62f82 | 2004-04-13 15:21:18 +0000 | [diff] [blame] | 263 | if (PN == 0) return 0; // No known way to partition. |
Chris Lattner | 529b28d | 2004-04-13 05:05:33 +0000 | [diff] [blame] | 264 | |
Chris Lattner | 1f62f82 | 2004-04-13 15:21:18 +0000 | [diff] [blame] | 265 | // Pull out all predecessors that have varying values in the loop. This |
| 266 | // handles the case when a PHI node has multiple instances of itself as |
| 267 | // arguments. |
Chris Lattner | 54b9c3b | 2008-04-21 01:28:02 +0000 | [diff] [blame] | 268 | SmallVector<BasicBlock*, 8> OuterLoopPreds; |
Andrew Trick | 7edc277 | 2012-03-20 21:24:52 +0000 | [diff] [blame] | 269 | for (unsigned i = 0, e = PN->getNumIncomingValues(); i != e; ++i) { |
Chris Lattner | 1f62f82 | 2004-04-13 15:21:18 +0000 | [diff] [blame] | 270 | if (PN->getIncomingValue(i) != PN || |
Andrew Trick | 7edc277 | 2012-03-20 21:24:52 +0000 | [diff] [blame] | 271 | !L->contains(PN->getIncomingBlock(i))) { |
| 272 | // We can't split indirectbr edges. |
| 273 | if (isa<IndirectBrInst>(PN->getIncomingBlock(i)->getTerminator())) |
| 274 | return 0; |
Chris Lattner | 1f62f82 | 2004-04-13 15:21:18 +0000 | [diff] [blame] | 275 | OuterLoopPreds.push_back(PN->getIncomingBlock(i)); |
Andrew Trick | 7edc277 | 2012-03-20 21:24:52 +0000 | [diff] [blame] | 276 | } |
| 277 | } |
Dan Gohman | c5e49c6 | 2010-03-01 17:55:27 +0000 | [diff] [blame] | 278 | DEBUG(dbgs() << "LoopSimplify: Splitting out a new outer loop\n"); |
| 279 | |
Dan Gohman | ffa75cd | 2010-09-04 02:42:48 +0000 | [diff] [blame] | 280 | // If ScalarEvolution is around and knows anything about values in |
| 281 | // this loop, tell it to forget them, because we're about to |
| 282 | // substantially change it. |
| 283 | if (SE) |
| 284 | SE->forgetLoop(L); |
| 285 | |
Chris Lattner | 4b66242 | 2004-04-13 16:23:25 +0000 | [diff] [blame] | 286 | BasicBlock *Header = L->getHeader(); |
Jakub Staszak | 2fac1d5 | 2011-12-09 21:19:53 +0000 | [diff] [blame] | 287 | BasicBlock *NewBB = |
Stephen Hines | 36b5688 | 2014-04-23 16:57:46 -0700 | [diff] [blame] | 288 | SplitBlockPredecessors(Header, OuterLoopPreds, ".outer", PP); |
Chris Lattner | 529b28d | 2004-04-13 05:05:33 +0000 | [diff] [blame] | 289 | |
Chris Lattner | 120fce5 | 2006-09-23 08:19:21 +0000 | [diff] [blame] | 290 | // Make sure that NewBB is put someplace intelligent, which doesn't mess up |
| 291 | // code layout too horribly. |
Stephen Hines | 36b5688 | 2014-04-23 16:57:46 -0700 | [diff] [blame] | 292 | placeSplitBlockCarefully(NewBB, OuterLoopPreds, L); |
Andrew Trick | 1c3ff65 | 2011-08-03 18:28:21 +0000 | [diff] [blame] | 293 | |
Chris Lattner | 529b28d | 2004-04-13 05:05:33 +0000 | [diff] [blame] | 294 | // Create the new outer loop. |
| 295 | Loop *NewOuter = new Loop(); |
| 296 | |
Chris Lattner | 529b28d | 2004-04-13 05:05:33 +0000 | [diff] [blame] | 297 | // Change the parent loop to use the outer loop as its child now. |
| 298 | if (Loop *Parent = L->getParentLoop()) |
| 299 | Parent->replaceChildLoopWith(L, NewOuter); |
| 300 | else |
Chris Lattner | c27e056 | 2006-02-14 22:34:08 +0000 | [diff] [blame] | 301 | LI->changeTopLevelLoop(L, NewOuter); |
Chris Lattner | 529b28d | 2004-04-13 05:05:33 +0000 | [diff] [blame] | 302 | |
Chris Lattner | 529b28d | 2004-04-13 05:05:33 +0000 | [diff] [blame] | 303 | // L is now a subloop of our outer loop. |
| 304 | NewOuter->addChildLoop(L); |
| 305 | |
Dan Gohman | 9b78763 | 2008-06-22 20:18:58 +0000 | [diff] [blame] | 306 | for (Loop::block_iterator I = L->block_begin(), E = L->block_end(); |
| 307 | I != E; ++I) |
| 308 | NewOuter->addBlockEntry(*I); |
Chris Lattner | 529b28d | 2004-04-13 05:05:33 +0000 | [diff] [blame] | 309 | |
Dan Gohman | 5c89b52 | 2009-09-08 15:45:00 +0000 | [diff] [blame] | 310 | // Now reset the header in L, which had been moved by |
| 311 | // SplitBlockPredecessors for the outer loop. |
| 312 | L->moveToHeader(Header); |
| 313 | |
Chris Lattner | 529b28d | 2004-04-13 05:05:33 +0000 | [diff] [blame] | 314 | // Determine which blocks should stay in L and which should be moved out to |
| 315 | // the Outer loop now. |
Chris Lattner | 529b28d | 2004-04-13 05:05:33 +0000 | [diff] [blame] | 316 | std::set<BasicBlock*> BlocksInL; |
Gabor Greif | 9672414 | 2010-07-09 14:02:13 +0000 | [diff] [blame] | 317 | for (pred_iterator PI=pred_begin(Header), E = pred_end(Header); PI!=E; ++PI) { |
| 318 | BasicBlock *P = *PI; |
| 319 | if (DT->dominates(Header, P)) |
Stephen Hines | 36b5688 | 2014-04-23 16:57:46 -0700 | [diff] [blame] | 320 | addBlockAndPredsToSet(P, Header, BlocksInL); |
Gabor Greif | 9672414 | 2010-07-09 14:02:13 +0000 | [diff] [blame] | 321 | } |
Chris Lattner | 529b28d | 2004-04-13 05:05:33 +0000 | [diff] [blame] | 322 | |
| 323 | // Scan all of the loop children of L, moving them to OuterLoop if they are |
| 324 | // not part of the inner loop. |
David Greene | c08fa28 | 2007-06-29 02:53:16 +0000 | [diff] [blame] | 325 | const std::vector<Loop*> &SubLoops = L->getSubLoops(); |
| 326 | for (size_t I = 0; I != SubLoops.size(); ) |
| 327 | if (BlocksInL.count(SubLoops[I]->getHeader())) |
Chris Lattner | 529b28d | 2004-04-13 05:05:33 +0000 | [diff] [blame] | 328 | ++I; // Loop remains in L |
| 329 | else |
David Greene | c08fa28 | 2007-06-29 02:53:16 +0000 | [diff] [blame] | 330 | NewOuter->addChildLoop(L->removeChildLoop(SubLoops.begin() + I)); |
Chris Lattner | 529b28d | 2004-04-13 05:05:33 +0000 | [diff] [blame] | 331 | |
| 332 | // Now that we know which blocks are in L and which need to be moved to |
| 333 | // OuterLoop, move any blocks that need it. |
| 334 | for (unsigned i = 0; i != L->getBlocks().size(); ++i) { |
| 335 | BasicBlock *BB = L->getBlocks()[i]; |
| 336 | if (!BlocksInL.count(BB)) { |
| 337 | // Move this block to the parent, updating the exit blocks sets |
| 338 | L->removeBlockFromLoop(BB); |
Chris Lattner | c27e056 | 2006-02-14 22:34:08 +0000 | [diff] [blame] | 339 | if ((*LI)[BB] == L) |
| 340 | LI->changeLoopFor(BB, NewOuter); |
Chris Lattner | 529b28d | 2004-04-13 05:05:33 +0000 | [diff] [blame] | 341 | --i; |
| 342 | } |
| 343 | } |
| 344 | |
Chris Lattner | 529b28d | 2004-04-13 05:05:33 +0000 | [diff] [blame] | 345 | return NewOuter; |
| 346 | } |
| 347 | |
Stephen Hines | 36b5688 | 2014-04-23 16:57:46 -0700 | [diff] [blame] | 348 | /// \brief This method is called when the specified loop has more than one |
| 349 | /// backedge in it. |
Chris Lattner | 2ab6a73 | 2003-10-13 00:37:13 +0000 | [diff] [blame] | 350 | /// |
Stephen Hines | 36b5688 | 2014-04-23 16:57:46 -0700 | [diff] [blame] | 351 | /// If this occurs, revector all of these backedges to target a new basic block |
| 352 | /// and have that block branch to the loop header. This ensures that loops |
| 353 | /// have exactly one backedge. |
| 354 | static BasicBlock *insertUniqueBackedgeBlock(Loop *L, BasicBlock *Preheader, |
| 355 | AliasAnalysis *AA, |
| 356 | DominatorTree *DT, LoopInfo *LI) { |
Chris Lattner | 2ab6a73 | 2003-10-13 00:37:13 +0000 | [diff] [blame] | 357 | assert(L->getNumBackEdges() > 1 && "Must have > 1 backedge!"); |
| 358 | |
| 359 | // Get information about the loop |
Chris Lattner | 2ab6a73 | 2003-10-13 00:37:13 +0000 | [diff] [blame] | 360 | BasicBlock *Header = L->getHeader(); |
| 361 | Function *F = Header->getParent(); |
| 362 | |
Dan Gohman | f4e82d1 | 2009-11-05 21:14:46 +0000 | [diff] [blame] | 363 | // Unique backedge insertion currently depends on having a preheader. |
| 364 | if (!Preheader) |
| 365 | return 0; |
| 366 | |
Eli Friedman | 7d1ff37 | 2011-12-15 00:50:34 +0000 | [diff] [blame] | 367 | // The header is not a landing pad; preheader insertion should ensure this. |
| 368 | assert(!Header->isLandingPad() && "Can't insert backedge to landing pad"); |
| 369 | |
Chris Lattner | 2ab6a73 | 2003-10-13 00:37:13 +0000 | [diff] [blame] | 370 | // Figure out which basic blocks contain back-edges to the loop header. |
| 371 | std::vector<BasicBlock*> BackedgeBlocks; |
Gabor Greif | bf2eefd | 2010-07-09 16:26:41 +0000 | [diff] [blame] | 372 | for (pred_iterator I = pred_begin(Header), E = pred_end(Header); I != E; ++I){ |
| 373 | BasicBlock *P = *I; |
Dan Gohman | c2f4006 | 2010-08-14 00:43:09 +0000 | [diff] [blame] | 374 | |
| 375 | // Indirectbr edges cannot be split, so we must fail if we find one. |
| 376 | if (isa<IndirectBrInst>(P->getTerminator())) |
| 377 | return 0; |
| 378 | |
Gabor Greif | bf2eefd | 2010-07-09 16:26:41 +0000 | [diff] [blame] | 379 | if (P != Preheader) BackedgeBlocks.push_back(P); |
| 380 | } |
Chris Lattner | 2ab6a73 | 2003-10-13 00:37:13 +0000 | [diff] [blame] | 381 | |
| 382 | // Create and insert the new backedge block... |
Owen Anderson | 1d0be15 | 2009-08-13 21:58:54 +0000 | [diff] [blame] | 383 | BasicBlock *BEBlock = BasicBlock::Create(Header->getContext(), |
| 384 | Header->getName()+".backedge", F); |
Gabor Greif | 051a950 | 2008-04-06 20:25:17 +0000 | [diff] [blame] | 385 | BranchInst *BETerminator = BranchInst::Create(Header, BEBlock); |
Chris Lattner | 2ab6a73 | 2003-10-13 00:37:13 +0000 | [diff] [blame] | 386 | |
Chris Lattner | 9fc5cdf | 2011-01-02 22:09:33 +0000 | [diff] [blame] | 387 | DEBUG(dbgs() << "LoopSimplify: Inserting unique backedge block " |
| 388 | << BEBlock->getName() << "\n"); |
Dan Gohman | c5e49c6 | 2010-03-01 17:55:27 +0000 | [diff] [blame] | 389 | |
Chris Lattner | 2ab6a73 | 2003-10-13 00:37:13 +0000 | [diff] [blame] | 390 | // Move the new backedge block to right after the last backedge block. |
| 391 | Function::iterator InsertPos = BackedgeBlocks.back(); ++InsertPos; |
| 392 | F->getBasicBlockList().splice(InsertPos, F->getBasicBlockList(), BEBlock); |
Misha Brukman | fd93908 | 2005-04-21 23:48:37 +0000 | [diff] [blame] | 393 | |
Chris Lattner | 2ab6a73 | 2003-10-13 00:37:13 +0000 | [diff] [blame] | 394 | // Now that the block has been inserted into the function, create PHI nodes in |
| 395 | // the backedge block which correspond to any PHI nodes in the header block. |
Alkis Evlogimenos | 200a360 | 2004-09-28 02:40:37 +0000 | [diff] [blame] | 396 | for (BasicBlock::iterator I = Header->begin(); isa<PHINode>(I); ++I) { |
| 397 | PHINode *PN = cast<PHINode>(I); |
Jay Foad | 3ecfc86 | 2011-03-30 11:28:46 +0000 | [diff] [blame] | 398 | PHINode *NewPN = PHINode::Create(PN->getType(), BackedgeBlocks.size(), |
| 399 | PN->getName()+".be", BETerminator); |
Chris Lattner | cec5b88 | 2005-03-25 06:37:22 +0000 | [diff] [blame] | 400 | if (AA) AA->copyValue(PN, NewPN); |
Chris Lattner | 2ab6a73 | 2003-10-13 00:37:13 +0000 | [diff] [blame] | 401 | |
| 402 | // Loop over the PHI node, moving all entries except the one for the |
| 403 | // preheader over to the new PHI node. |
| 404 | unsigned PreheaderIdx = ~0U; |
| 405 | bool HasUniqueIncomingValue = true; |
| 406 | Value *UniqueValue = 0; |
| 407 | for (unsigned i = 0, e = PN->getNumIncomingValues(); i != e; ++i) { |
| 408 | BasicBlock *IBB = PN->getIncomingBlock(i); |
| 409 | Value *IV = PN->getIncomingValue(i); |
| 410 | if (IBB == Preheader) { |
| 411 | PreheaderIdx = i; |
| 412 | } else { |
| 413 | NewPN->addIncoming(IV, IBB); |
| 414 | if (HasUniqueIncomingValue) { |
| 415 | if (UniqueValue == 0) |
| 416 | UniqueValue = IV; |
| 417 | else if (UniqueValue != IV) |
| 418 | HasUniqueIncomingValue = false; |
| 419 | } |
| 420 | } |
| 421 | } |
Misha Brukman | fd93908 | 2005-04-21 23:48:37 +0000 | [diff] [blame] | 422 | |
Chris Lattner | 2ab6a73 | 2003-10-13 00:37:13 +0000 | [diff] [blame] | 423 | // Delete all of the incoming values from the old PN except the preheader's |
| 424 | assert(PreheaderIdx != ~0U && "PHI has no preheader entry??"); |
| 425 | if (PreheaderIdx != 0) { |
| 426 | PN->setIncomingValue(0, PN->getIncomingValue(PreheaderIdx)); |
| 427 | PN->setIncomingBlock(0, PN->getIncomingBlock(PreheaderIdx)); |
| 428 | } |
Chris Lattner | 5551706 | 2005-01-29 00:39:08 +0000 | [diff] [blame] | 429 | // Nuke all entries except the zero'th. |
| 430 | for (unsigned i = 0, e = PN->getNumIncomingValues()-1; i != e; ++i) |
| 431 | PN->removeIncomingValue(e-i, false); |
Chris Lattner | 2ab6a73 | 2003-10-13 00:37:13 +0000 | [diff] [blame] | 432 | |
| 433 | // Finally, add the newly constructed PHI node as the entry for the BEBlock. |
| 434 | PN->addIncoming(NewPN, BEBlock); |
| 435 | |
| 436 | // As an optimization, if all incoming values in the new PhiNode (which is a |
| 437 | // subset of the incoming values of the old PHI node) have the same value, |
| 438 | // eliminate the PHI Node. |
| 439 | if (HasUniqueIncomingValue) { |
| 440 | NewPN->replaceAllUsesWith(UniqueValue); |
Chris Lattner | cec5b88 | 2005-03-25 06:37:22 +0000 | [diff] [blame] | 441 | if (AA) AA->deleteValue(NewPN); |
Chris Lattner | 2ab6a73 | 2003-10-13 00:37:13 +0000 | [diff] [blame] | 442 | BEBlock->getInstList().erase(NewPN); |
| 443 | } |
| 444 | } |
| 445 | |
| 446 | // Now that all of the PHI nodes have been inserted and adjusted, modify the |
  // backedge blocks to jump to the BEBlock instead of the header.
Chris Lattner | 2ab6a73 | 2003-10-13 00:37:13 +0000 | [diff] [blame] | 448 | for (unsigned i = 0, e = BackedgeBlocks.size(); i != e; ++i) { |
| 449 | TerminatorInst *TI = BackedgeBlocks[i]->getTerminator(); |
| 450 | for (unsigned Op = 0, e = TI->getNumSuccessors(); Op != e; ++Op) |
| 451 | if (TI->getSuccessor(Op) == Header) |
| 452 | TI->setSuccessor(Op, BEBlock); |
| 453 | } |
| 454 | |
| 455 | //===--- Update all analyses which we must preserve now -----------------===// |
| 456 | |
| 457 | // Update Loop Information - we know that this block is now in the current |
| 458 | // loop and all parent loops. |
Owen Anderson | d735ee8 | 2007-11-27 03:43:35 +0000 | [diff] [blame] | 459 | L->addBasicBlockToLoop(BEBlock, LI->getBase()); |
Chris Lattner | 2ab6a73 | 2003-10-13 00:37:13 +0000 | [diff] [blame] | 460 | |
Devang Patel | 0e7f728 | 2007-06-21 17:23:45 +0000 | [diff] [blame] | 461 | // Update dominator information |
| 462 | DT->splitBlock(BEBlock); |
Dan Gohman | f4e82d1 | 2009-11-05 21:14:46 +0000 | [diff] [blame] | 463 | |
| 464 | return BEBlock; |
| 465 | } |
| 466 | |
Stephen Hines | 36b5688 | 2014-04-23 16:57:46 -0700 | [diff] [blame] | 467 | /// \brief Simplify one loop and queue further loops for simplification. |
| 468 | /// |
| 469 | /// FIXME: Currently this accepts both lots of analyses that it uses and a raw |
| 470 | /// Pass pointer. The Pass pointer is used by numerous utilities to update |
| 471 | /// specific analyses. Rather than a pass it would be much cleaner and more |
| 472 | /// explicit if they accepted the analysis directly and then updated it. |
| 473 | static bool simplifyOneLoop(Loop *L, SmallVectorImpl<Loop *> &Worklist, |
| 474 | AliasAnalysis *AA, DominatorTree *DT, LoopInfo *LI, |
| 475 | ScalarEvolution *SE, Pass *PP) { |
| 476 | bool Changed = false; |
| 477 | ReprocessLoop: |
| 478 | |
| 479 | // Check to see that no blocks (other than the header) in this loop have |
| 480 | // predecessors that are not in the loop. This is not valid for natural |
| 481 | // loops, but can occur if the blocks are unreachable. Since they are |
| 482 | // unreachable we can just shamelessly delete those CFG edges! |
| 483 | for (Loop::block_iterator BB = L->block_begin(), E = L->block_end(); |
| 484 | BB != E; ++BB) { |
| 485 | if (*BB == L->getHeader()) continue; |
| 486 | |
| 487 | SmallPtrSet<BasicBlock*, 4> BadPreds; |
| 488 | for (pred_iterator PI = pred_begin(*BB), |
| 489 | PE = pred_end(*BB); PI != PE; ++PI) { |
| 490 | BasicBlock *P = *PI; |
| 491 | if (!L->contains(P)) |
| 492 | BadPreds.insert(P); |
| 493 | } |
| 494 | |
| 495 | // Delete each unique out-of-loop (and thus dead) predecessor. |
| 496 | for (SmallPtrSet<BasicBlock*, 4>::iterator I = BadPreds.begin(), |
| 497 | E = BadPreds.end(); I != E; ++I) { |
| 498 | |
| 499 | DEBUG(dbgs() << "LoopSimplify: Deleting edge from dead predecessor " |
| 500 | << (*I)->getName() << "\n"); |
| 501 | |
| 502 | // Inform each successor of each dead pred. |
| 503 | for (succ_iterator SI = succ_begin(*I), SE = succ_end(*I); SI != SE; ++SI) |
| 504 | (*SI)->removePredecessor(*I); |
| 505 | // Zap the dead pred's terminator and replace it with unreachable. |
| 506 | TerminatorInst *TI = (*I)->getTerminator(); |
| 507 | TI->replaceAllUsesWith(UndefValue::get(TI->getType())); |
| 508 | (*I)->getTerminator()->eraseFromParent(); |
| 509 | new UnreachableInst((*I)->getContext(), *I); |
| 510 | Changed = true; |
| 511 | } |
| 512 | } |
| 513 | |
| 514 | // If there are exiting blocks with branches on undef, resolve the undef in |
| 515 | // the direction which will exit the loop. This will help simplify loop |
| 516 | // trip count computations. |
| 517 | SmallVector<BasicBlock*, 8> ExitingBlocks; |
| 518 | L->getExitingBlocks(ExitingBlocks); |
| 519 | for (SmallVectorImpl<BasicBlock *>::iterator I = ExitingBlocks.begin(), |
| 520 | E = ExitingBlocks.end(); I != E; ++I) |
| 521 | if (BranchInst *BI = dyn_cast<BranchInst>((*I)->getTerminator())) |
| 522 | if (BI->isConditional()) { |
| 523 | if (UndefValue *Cond = dyn_cast<UndefValue>(BI->getCondition())) { |
| 524 | |
| 525 | DEBUG(dbgs() << "LoopSimplify: Resolving \"br i1 undef\" to exit in " |
| 526 | << (*I)->getName() << "\n"); |
| 527 | |
| 528 | BI->setCondition(ConstantInt::get(Cond->getType(), |
| 529 | !L->contains(BI->getSuccessor(0)))); |
| 530 | |
| 531 | // This may make the loop analyzable, force SCEV recomputation. |
| 532 | if (SE) |
| 533 | SE->forgetLoop(L); |
| 534 | |
| 535 | Changed = true; |
| 536 | } |
| 537 | } |
| 538 | |
| 539 | // Does the loop already have a preheader? If so, don't insert one. |
| 540 | BasicBlock *Preheader = L->getLoopPreheader(); |
| 541 | if (!Preheader) { |
| 542 | Preheader = InsertPreheaderForLoop(L, PP); |
| 543 | if (Preheader) { |
| 544 | ++NumInserted; |
| 545 | Changed = true; |
| 546 | } |
| 547 | } |
| 548 | |
| 549 | // Next, check to make sure that all exit nodes of the loop only have |
| 550 | // predecessors that are inside of the loop. This check guarantees that the |
| 551 | // loop preheader/header will dominate the exit blocks. If the exit block has |
| 552 | // predecessors from outside of the loop, split the edge now. |
| 553 | SmallVector<BasicBlock*, 8> ExitBlocks; |
| 554 | L->getExitBlocks(ExitBlocks); |
| 555 | |
| 556 | SmallSetVector<BasicBlock *, 8> ExitBlockSet(ExitBlocks.begin(), |
| 557 | ExitBlocks.end()); |
| 558 | for (SmallSetVector<BasicBlock *, 8>::iterator I = ExitBlockSet.begin(), |
| 559 | E = ExitBlockSet.end(); I != E; ++I) { |
| 560 | BasicBlock *ExitBlock = *I; |
| 561 | for (pred_iterator PI = pred_begin(ExitBlock), PE = pred_end(ExitBlock); |
| 562 | PI != PE; ++PI) |
| 563 | // Must be exactly this loop: no subloops, parent loops, or non-loop preds |
| 564 | // allowed. |
| 565 | if (!L->contains(*PI)) { |
| 566 | if (rewriteLoopExitBlock(L, ExitBlock, PP)) { |
| 567 | ++NumInserted; |
| 568 | Changed = true; |
| 569 | } |
| 570 | break; |
| 571 | } |
| 572 | } |
| 573 | |
| 574 | // If the header has more than two predecessors at this point (from the |
| 575 | // preheader and from multiple backedges), we must adjust the loop. |
| 576 | BasicBlock *LoopLatch = L->getLoopLatch(); |
| 577 | if (!LoopLatch) { |
| 578 | // If this is really a nested loop, rip it out into a child loop. Don't do |
| 579 | // this for loops with a giant number of backedges, just factor them into a |
| 580 | // common backedge instead. |
| 581 | if (L->getNumBackEdges() < 8) { |
| 582 | if (Loop *OuterL = separateNestedLoop(L, Preheader, AA, DT, LI, SE, PP)) { |
| 583 | ++NumNested; |
| 584 | // Enqueue the outer loop as it should be processed next in our |
| 585 | // depth-first nest walk. |
| 586 | Worklist.push_back(OuterL); |
| 587 | |
| 588 | // This is a big restructuring change, reprocess the whole loop. |
| 589 | Changed = true; |
| 590 | // GCC doesn't tail recursion eliminate this. |
| 591 | // FIXME: It isn't clear we can't rely on LLVM to TRE this. |
| 592 | goto ReprocessLoop; |
| 593 | } |
| 594 | } |
| 595 | |
| 596 | // If we either couldn't, or didn't want to, identify nesting of the loops, |
| 597 | // insert a new block that all backedges target, then make it jump to the |
| 598 | // loop header. |
| 599 | LoopLatch = insertUniqueBackedgeBlock(L, Preheader, AA, DT, LI); |
| 600 | if (LoopLatch) { |
| 601 | ++NumInserted; |
| 602 | Changed = true; |
| 603 | } |
| 604 | } |
| 605 | |
| 606 | // Scan over the PHI nodes in the loop header. Since they now have only two |
| 607 | // incoming values (the loop is canonicalized), we may have simplified the PHI |
| 608 | // down to 'X = phi [X, Y]', which should be replaced with 'Y'. |
| 609 | PHINode *PN; |
| 610 | for (BasicBlock::iterator I = L->getHeader()->begin(); |
| 611 | (PN = dyn_cast<PHINode>(I++)); ) |
| 612 | if (Value *V = SimplifyInstruction(PN, 0, 0, DT)) { |
| 613 | if (AA) AA->deleteValue(PN); |
| 614 | if (SE) SE->forgetValue(PN); |
| 615 | PN->replaceAllUsesWith(V); |
| 616 | PN->eraseFromParent(); |
| 617 | } |
| 618 | |
| 619 | // If this loop has multiple exits and the exits all go to the same |
| 620 | // block, attempt to merge the exits. This helps several passes, such |
| 621 | // as LoopRotation, which do not support loops with multiple exits. |
| 622 | // SimplifyCFG also does this (and this code uses the same utility |
| 623 | // function), however this code is loop-aware, where SimplifyCFG is |
| 624 | // not. That gives it the advantage of being able to hoist |
| 625 | // loop-invariant instructions out of the way to open up more |
| 626 | // opportunities, and the disadvantage of having the responsibility |
| 627 | // to preserve dominator information. |
| 628 | bool UniqueExit = true; |
| 629 | if (!ExitBlocks.empty()) |
| 630 | for (unsigned i = 1, e = ExitBlocks.size(); i != e; ++i) |
| 631 | if (ExitBlocks[i] != ExitBlocks[0]) { |
| 632 | UniqueExit = false; |
| 633 | break; |
| 634 | } |
| 635 | if (UniqueExit) { |
| 636 | for (unsigned i = 0, e = ExitingBlocks.size(); i != e; ++i) { |
| 637 | BasicBlock *ExitingBlock = ExitingBlocks[i]; |
| 638 | if (!ExitingBlock->getSinglePredecessor()) continue; |
| 639 | BranchInst *BI = dyn_cast<BranchInst>(ExitingBlock->getTerminator()); |
| 640 | if (!BI || !BI->isConditional()) continue; |
| 641 | CmpInst *CI = dyn_cast<CmpInst>(BI->getCondition()); |
| 642 | if (!CI || CI->getParent() != ExitingBlock) continue; |
| 643 | |
| 644 | // Attempt to hoist out all instructions except for the |
| 645 | // comparison and the branch. |
| 646 | bool AllInvariant = true; |
| 647 | bool AnyInvariant = false; |
| 648 | for (BasicBlock::iterator I = ExitingBlock->begin(); &*I != BI; ) { |
| 649 | Instruction *Inst = I++; |
| 650 | // Skip debug info intrinsics. |
| 651 | if (isa<DbgInfoIntrinsic>(Inst)) |
| 652 | continue; |
| 653 | if (Inst == CI) |
| 654 | continue; |
| 655 | if (!L->makeLoopInvariant(Inst, AnyInvariant, |
| 656 | Preheader ? Preheader->getTerminator() : 0)) { |
| 657 | AllInvariant = false; |
| 658 | break; |
| 659 | } |
| 660 | } |
| 661 | if (AnyInvariant) { |
| 662 | Changed = true; |
| 663 | // The loop disposition of all SCEV expressions that depend on any |
| 664 | // hoisted values have also changed. |
| 665 | if (SE) |
| 666 | SE->forgetLoopDispositions(L); |
| 667 | } |
| 668 | if (!AllInvariant) continue; |
| 669 | |
| 670 | // The block has now been cleared of all instructions except for |
| 671 | // a comparison and a conditional branch. SimplifyCFG may be able |
| 672 | // to fold it now. |
| 673 | if (!FoldBranchToCommonDest(BI)) continue; |
| 674 | |
| 675 | // Success. The block is now dead, so remove it from the loop, |
| 676 | // update the dominator tree and delete it. |
| 677 | DEBUG(dbgs() << "LoopSimplify: Eliminating exiting block " |
| 678 | << ExitingBlock->getName() << "\n"); |
| 679 | |
| 680 | // Notify ScalarEvolution before deleting this block. Currently assume the |
| 681 | // parent loop doesn't change (spliting edges doesn't count). If blocks, |
| 682 | // CFG edges, or other values in the parent loop change, then we need call |
| 683 | // to forgetLoop() for the parent instead. |
| 684 | if (SE) |
| 685 | SE->forgetLoop(L); |
| 686 | |
| 687 | assert(pred_begin(ExitingBlock) == pred_end(ExitingBlock)); |
| 688 | Changed = true; |
| 689 | LI->removeBlock(ExitingBlock); |
| 690 | |
| 691 | DomTreeNode *Node = DT->getNode(ExitingBlock); |
| 692 | const std::vector<DomTreeNodeBase<BasicBlock> *> &Children = |
| 693 | Node->getChildren(); |
| 694 | while (!Children.empty()) { |
| 695 | DomTreeNode *Child = Children.front(); |
| 696 | DT->changeImmediateDominator(Child, Node->getIDom()); |
| 697 | } |
| 698 | DT->eraseNode(ExitingBlock); |
| 699 | |
| 700 | BI->getSuccessor(0)->removePredecessor(ExitingBlock); |
| 701 | BI->getSuccessor(1)->removePredecessor(ExitingBlock); |
| 702 | ExitingBlock->eraseFromParent(); |
| 703 | } |
| 704 | } |
| 705 | |
| 706 | return Changed; |
| 707 | } |
| 708 | |
| 709 | bool llvm::simplifyLoop(Loop *L, DominatorTree *DT, LoopInfo *LI, Pass *PP, |
| 710 | AliasAnalysis *AA, ScalarEvolution *SE) { |
| 711 | bool Changed = false; |
| 712 | |
| 713 | // Worklist maintains our depth-first queue of loops in this nest to process. |
| 714 | SmallVector<Loop *, 4> Worklist; |
| 715 | Worklist.push_back(L); |
| 716 | |
| 717 | // Walk the worklist from front to back, pushing newly found sub loops onto |
| 718 | // the back. This will let us process loops from back to front in depth-first |
| 719 | // order. We can use this simple process because loops form a tree. |
| 720 | for (unsigned Idx = 0; Idx != Worklist.size(); ++Idx) { |
| 721 | Loop *L2 = Worklist[Idx]; |
| 722 | for (Loop::iterator I = L2->begin(), E = L2->end(); I != E; ++I) |
| 723 | Worklist.push_back(*I); |
| 724 | } |
| 725 | |
| 726 | while (!Worklist.empty()) |
| 727 | Changed |= simplifyOneLoop(Worklist.pop_back_val(), Worklist, AA, DT, LI, SE, PP); |
| 728 | |
| 729 | return Changed; |
| 730 | } |
| 731 | |
| 732 | namespace { |
| 733 | struct LoopSimplify : public FunctionPass { |
| 734 | static char ID; // Pass identification, replacement for typeid |
| 735 | LoopSimplify() : FunctionPass(ID) { |
| 736 | initializeLoopSimplifyPass(*PassRegistry::getPassRegistry()); |
| 737 | } |
| 738 | |
| 739 | // AA - If we have an alias analysis object to update, this is it, otherwise |
| 740 | // this is null. |
| 741 | AliasAnalysis *AA; |
| 742 | DominatorTree *DT; |
| 743 | LoopInfo *LI; |
| 744 | ScalarEvolution *SE; |
| 745 | |
| 746 | bool runOnFunction(Function &F) override; |
| 747 | |
| 748 | void getAnalysisUsage(AnalysisUsage &AU) const override { |
| 749 | // We need loop information to identify the loops... |
| 750 | AU.addRequired<DominatorTreeWrapperPass>(); |
| 751 | AU.addPreserved<DominatorTreeWrapperPass>(); |
| 752 | |
| 753 | AU.addRequired<LoopInfo>(); |
| 754 | AU.addPreserved<LoopInfo>(); |
| 755 | |
| 756 | AU.addPreserved<AliasAnalysis>(); |
| 757 | AU.addPreserved<ScalarEvolution>(); |
| 758 | AU.addPreserved<DependenceAnalysis>(); |
| 759 | AU.addPreservedID(BreakCriticalEdgesID); // No critical edges added. |
| 760 | } |
| 761 | |
| 762 | /// verifyAnalysis() - Verify LoopSimplifyForm's guarantees. |
| 763 | void verifyAnalysis() const override; |
| 764 | |
| 765 | private: |
| 766 | bool ProcessLoop(Loop *L); |
| 767 | BasicBlock *RewriteLoopExitBlock(Loop *L, BasicBlock *Exit); |
| 768 | Loop *SeparateNestedLoop(Loop *L, BasicBlock *Preheader); |
| 769 | BasicBlock *InsertUniqueBackedgeBlock(Loop *L, BasicBlock *Preheader); |
| 770 | }; |
| 771 | } |
| 772 | |
| 773 | char LoopSimplify::ID = 0; |
| 774 | INITIALIZE_PASS_BEGIN(LoopSimplify, "loop-simplify", |
| 775 | "Canonicalize natural loops", true, false) |
| 776 | INITIALIZE_PASS_DEPENDENCY(DominatorTreeWrapperPass) |
| 777 | INITIALIZE_PASS_DEPENDENCY(LoopInfo) |
| 778 | INITIALIZE_PASS_END(LoopSimplify, "loop-simplify", |
| 779 | "Canonicalize natural loops", true, false) |
| 780 | |
| 781 | // Publicly exposed interface to pass... |
| 782 | char &llvm::LoopSimplifyID = LoopSimplify::ID; |
| 783 | Pass *llvm::createLoopSimplifyPass() { return new LoopSimplify(); } |
| 784 | |
| 785 | /// runOnLoop - Run down all loops in the CFG (recursively, but we could do |
| 786 | /// it in any convenient order) inserting preheaders... |
| 787 | /// |
| 788 | bool LoopSimplify::runOnFunction(Function &F) { |
| 789 | bool Changed = false; |
| 790 | AA = getAnalysisIfAvailable<AliasAnalysis>(); |
| 791 | LI = &getAnalysis<LoopInfo>(); |
| 792 | DT = &getAnalysis<DominatorTreeWrapperPass>().getDomTree(); |
| 793 | SE = getAnalysisIfAvailable<ScalarEvolution>(); |
| 794 | |
| 795 | // Simplify each loop nest in the function. |
| 796 | for (LoopInfo::iterator I = LI->begin(), E = LI->end(); I != E; ++I) |
| 797 | Changed |= simplifyLoop(*I, DT, LI, this, AA, SE); |
| 798 | |
| 799 | return Changed; |
| 800 | } |
| 801 | |
// FIXME: Restore this code when we re-enable verification in verifyAnalysis
// below.
#if 0
/// Check that \p L and all of its subloops are in simplified form, tolerating
/// the cases where an indirectbr makes the transformation impossible.
static void verifyLoop(Loop *L) {
  // Verify subloops.
  for (Loop::iterator I = L->begin(), E = L->end(); I != E; ++I)
    verifyLoop(*I);

  // It used to be possible to just assert L->isLoopSimplifyForm(), however
  // with the introduction of indirectbr, there are now cases where it's
  // not possible to transform a loop as necessary. We can at least check
  // that there is an indirectbr near any time there's trouble.

  // Indirectbr can interfere with preheader and unique backedge insertion.
  if (!L->getLoopPreheader() || !L->getLoopLatch()) {
    BasicBlock *Header = L->getHeader();
    bool HasIndBrPred = false;
    // Stop at the first header predecessor that ends in an indirectbr.
    for (pred_iterator PI = pred_begin(Header), PE = pred_end(Header);
         PI != PE && !HasIndBrPred; ++PI)
      HasIndBrPred = isa<IndirectBrInst>((*PI)->getTerminator());
    assert(HasIndBrPred &&
           "LoopSimplify has no excuse for missing loop header info!");
    (void)HasIndBrPred;
  }

  // Indirectbr can interfere with exit block canonicalization.
  if (!L->hasDedicatedExits()) {
    SmallVector<BasicBlock*, 8> ExitingBlocks;
    L->getExitingBlocks(ExitingBlocks);

    bool HasIndBrExiting = false;
    // Stop at the first exiting block that ends in an indirectbr.
    for (unsigned i = 0, e = ExitingBlocks.size();
         i != e && !HasIndBrExiting; ++i)
      HasIndBrExiting = isa<IndirectBrInst>(ExitingBlocks[i]->getTerminator());

    assert(HasIndBrExiting &&
           "LoopSimplify has no excuse for missing exit block info!");
    (void)HasIndBrExiting;
  }
}
#endif
| 847 | |
| 848 | void LoopSimplify::verifyAnalysis() const { |
| 849 | // FIXME: This routine is being called mid-way through the loop pass manager |
| 850 | // as loop passes destroy this analysis. That's actually fine, but we have no |
| 851 | // way of expressing that here. Once all of the passes that destroy this are |
| 852 | // hoisted out of the loop pass manager we can add back verification here. |
| 853 | #if 0 |
| 854 | for (LoopInfo::iterator I = LI->begin(), E = LI->end(); I != E; ++I) |
| 855 | verifyLoop(*I); |
| 856 | #endif |
| 857 | } |