Evan Cheng | bbf1db7 | 2009-05-07 05:42:24 +0000 | [diff] [blame] | 1 | //===-- CodePlacementOpt.cpp - Code Placement pass. -----------------------===// |
Evan Cheng | fb8075d | 2008-02-28 00:43:03 +0000 | [diff] [blame] | 2 | // |
| 3 | // The LLVM Compiler Infrastructure |
| 4 | // |
| 5 | // This file is distributed under the University of Illinois Open Source |
| 6 | // License. See LICENSE.TXT for details. |
| 7 | // |
| 8 | //===----------------------------------------------------------------------===// |
| 9 | // |
Evan Cheng | bbf1db7 | 2009-05-07 05:42:24 +0000 | [diff] [blame] | 10 | // This file implements the pass that optimizes code placement and aligns loop |
| 11 | // headers to a target-specific alignment boundary. |
Evan Cheng | fb8075d | 2008-02-28 00:43:03 +0000 | [diff] [blame] | 12 | // |
| 13 | //===----------------------------------------------------------------------===// |
| 14 | |
Evan Cheng | bbf1db7 | 2009-05-07 05:42:24 +0000 | [diff] [blame] | 15 | #define DEBUG_TYPE "code-placement" |
Evan Cheng | fb8075d | 2008-02-28 00:43:03 +0000 | [diff] [blame] | 16 | #include "llvm/CodeGen/MachineLoopInfo.h" |
| 17 | #include "llvm/CodeGen/MachineFunctionPass.h" |
| 18 | #include "llvm/CodeGen/Passes.h" |
Evan Cheng | 45e0010 | 2009-05-08 06:34:09 +0000 | [diff] [blame] | 19 | #include "llvm/Target/TargetInstrInfo.h" |
Evan Cheng | fb8075d | 2008-02-28 00:43:03 +0000 | [diff] [blame] | 20 | #include "llvm/Target/TargetLowering.h" |
| 21 | #include "llvm/Target/TargetMachine.h" |
Evan Cheng | 45e0010 | 2009-05-08 06:34:09 +0000 | [diff] [blame] | 22 | #include "llvm/Support/CommandLine.h" |
Evan Cheng | fb8075d | 2008-02-28 00:43:03 +0000 | [diff] [blame] | 23 | #include "llvm/Support/Compiler.h" |
| 24 | #include "llvm/Support/Debug.h" |
Evan Cheng | 45e0010 | 2009-05-08 06:34:09 +0000 | [diff] [blame] | 25 | #include "llvm/ADT/Statistic.h" |
Evan Cheng | fb8075d | 2008-02-28 00:43:03 +0000 | [diff] [blame] | 26 | using namespace llvm; |
| 27 | |
Evan Cheng | 45e0010 | 2009-05-08 06:34:09 +0000 | [diff] [blame] | 28 | static cl::opt<bool> |
| 29 | OptLoopBBPlacement("opt-loop-bb-placement", |
| 30 | cl::init(false), cl::Hidden, |
| 31 | cl::desc("Optimize block placements in loops")); |
| 32 | |
| 33 | STATISTIC(NumHeaderAligned, "Number of loop header aligned"); |
| 34 | STATISTIC(NumIntraElim, "Number of intra loop branches eliminated"); |
| 35 | STATISTIC(NumIntraMoved, "Number of intra loop branches moved"); |
| 36 | |
Evan Cheng | fb8075d | 2008-02-28 00:43:03 +0000 | [diff] [blame] | 37 | namespace { |
Evan Cheng | bbf1db7 | 2009-05-07 05:42:24 +0000 | [diff] [blame] | 38 | class CodePlacementOpt : public MachineFunctionPass { |
Evan Cheng | 7132e12 | 2009-05-07 05:49:39 +0000 | [diff] [blame] | 39 | const MachineLoopInfo *MLI; |
Evan Cheng | 45e0010 | 2009-05-08 06:34:09 +0000 | [diff] [blame] | 40 | const TargetInstrInfo *TII; |
| 41 | const TargetLowering *TLI; |
| 42 | |
| 43 | /// ChangedMBBs - BBs which are modified by OptimizeIntraLoopEdges. |
| 44 | SmallPtrSet<MachineBasicBlock*, 8> ChangedMBBs; |
| 45 | |
| 46 | /// UncondJmpMBBs - A list of BBs which are in loops and end with |
| 47 | /// unconditional branches. |
| 48 | SmallVector<std::pair<MachineBasicBlock*,MachineBasicBlock*>, 4> |
| 49 | UncondJmpMBBs; |
| 50 | |
| 51 | /// LoopHeaders - A list of BBs which are loop headers. |
| 52 | SmallVector<MachineBasicBlock*, 4> LoopHeaders; |
Evan Cheng | 7132e12 | 2009-05-07 05:49:39 +0000 | [diff] [blame] | 53 | |
Evan Cheng | fb8075d | 2008-02-28 00:43:03 +0000 | [diff] [blame] | 54 | public: |
| 55 | static char ID; |
Evan Cheng | bbf1db7 | 2009-05-07 05:42:24 +0000 | [diff] [blame] | 56 | CodePlacementOpt() : MachineFunctionPass(&ID) {} |
Evan Cheng | fb8075d | 2008-02-28 00:43:03 +0000 | [diff] [blame] | 57 | |
| 58 | virtual bool runOnMachineFunction(MachineFunction &MF); |
Evan Cheng | bbf1db7 | 2009-05-07 05:42:24 +0000 | [diff] [blame] | 59 | virtual const char *getPassName() const { |
| 60 | return "Code Placement Optimizater"; |
| 61 | } |
Evan Cheng | fb8075d | 2008-02-28 00:43:03 +0000 | [diff] [blame] | 62 | |
| 63 | virtual void getAnalysisUsage(AnalysisUsage &AU) const { |
| 64 | AU.addRequired<MachineLoopInfo>(); |
Evan Cheng | 8b56a90 | 2008-09-22 22:21:38 +0000 | [diff] [blame] | 65 | AU.addPreservedID(MachineDominatorsID); |
Evan Cheng | fb8075d | 2008-02-28 00:43:03 +0000 | [diff] [blame] | 66 | MachineFunctionPass::getAnalysisUsage(AU); |
| 67 | } |
Evan Cheng | 7132e12 | 2009-05-07 05:49:39 +0000 | [diff] [blame] | 68 | |
| 69 | private: |
Evan Cheng | 45e0010 | 2009-05-08 06:34:09 +0000 | [diff] [blame] | 70 | bool OptimizeIntraLoopEdges(); |
Evan Cheng | 7132e12 | 2009-05-07 05:49:39 +0000 | [diff] [blame] | 71 | bool AlignLoops(MachineFunction &MF); |
Evan Cheng | fb8075d | 2008-02-28 00:43:03 +0000 | [diff] [blame] | 72 | }; |
| 73 | |
Evan Cheng | bbf1db7 | 2009-05-07 05:42:24 +0000 | [diff] [blame] | 74 | char CodePlacementOpt::ID = 0; |
Evan Cheng | fb8075d | 2008-02-28 00:43:03 +0000 | [diff] [blame] | 75 | } // end anonymous namespace |
| 76 | |
Evan Cheng | bbf1db7 | 2009-05-07 05:42:24 +0000 | [diff] [blame] | 77 | FunctionPass *llvm::createCodePlacementOptPass() { |
| 78 | return new CodePlacementOpt(); |
| 79 | } |
Evan Cheng | fb8075d | 2008-02-28 00:43:03 +0000 | [diff] [blame] | 80 | |
Evan Cheng | 45e0010 | 2009-05-08 06:34:09 +0000 | [diff] [blame] | 81 | /// OptimizeBackEdges - Place loop back edges to move unconditional branches |
| 82 | /// out of the loop. |
| 83 | /// |
| 84 | /// A: |
| 85 | /// ... |
| 86 | /// <fallthrough to B> |
| 87 | /// |
| 88 | /// B: --> loop header |
| 89 | /// ... |
| 90 | /// jcc <cond> C, [exit] |
| 91 | /// |
| 92 | /// C: |
| 93 | /// ... |
| 94 | /// jmp B |
| 95 | /// |
| 96 | /// ==> |
| 97 | /// |
| 98 | /// A: |
| 99 | /// ... |
| 100 | /// jmp B |
| 101 | /// |
| 102 | /// C: --> new loop header |
| 103 | /// ... |
| 104 | /// <fallthough to B> |
| 105 | /// |
| 106 | /// B: |
| 107 | /// ... |
| 108 | /// jcc <cond> C, [exit] |
| 109 | /// |
| 110 | bool CodePlacementOpt::OptimizeIntraLoopEdges() { |
| 111 | if (!OptLoopBBPlacement) |
| 112 | return false; |
| 113 | |
| 114 | bool Changed = false; |
| 115 | for (unsigned i = 0, e = UncondJmpMBBs.size(); i != e; ++i) { |
| 116 | MachineBasicBlock *MBB = UncondJmpMBBs[i].first; |
| 117 | MachineBasicBlock *SuccMBB = UncondJmpMBBs[i].second; |
| 118 | MachineLoop *L = MLI->getLoopFor(MBB); |
| 119 | assert(L && "BB is expected to be in a loop!"); |
| 120 | |
| 121 | if (ChangedMBBs.count(MBB)) { |
| 122 | // BB has been modified, re-analyze. |
| 123 | MachineBasicBlock *TBB = 0, *FBB = 0; |
| 124 | SmallVector<MachineOperand, 4> Cond; |
| 125 | if (TII->AnalyzeBranch(*MBB, TBB, FBB, Cond) || !Cond.empty()) |
| 126 | continue; |
| 127 | if (MLI->getLoopFor(TBB) != L || TBB->isLandingPad()) |
| 128 | continue; |
| 129 | SuccMBB = TBB; |
| 130 | } else { |
| 131 | assert(MLI->getLoopFor(SuccMBB) == L && |
| 132 | "Successor is not in the same loop!"); |
| 133 | } |
| 134 | |
| 135 | if (MBB->isLayoutSuccessor(SuccMBB)) { |
| 136 | // Successor is right after MBB, just eliminate the unconditional jmp. |
| 137 | // Can this happen? |
| 138 | TII->RemoveBranch(*MBB); |
| 139 | ChangedMBBs.insert(MBB); |
| 140 | ++NumIntraElim; |
| 141 | continue; |
| 142 | } |
| 143 | |
| 144 | // Now check if the predecessor is fallthrough from any BB. If there is, |
| 145 | // that BB should be from outside the loop since edge will become a jmp. |
| 146 | bool OkToMove = true; |
| 147 | MachineBasicBlock *FtMBB = 0, *FtTBB = 0, *FtFBB = 0; |
| 148 | SmallVector<MachineOperand, 4> FtCond; |
| 149 | for (MachineBasicBlock::pred_iterator PI = SuccMBB->pred_begin(), |
| 150 | PE = SuccMBB->pred_end(); PI != PE; ++PI) { |
| 151 | MachineBasicBlock *PredMBB = *PI; |
| 152 | if (PredMBB->isLayoutSuccessor(SuccMBB)) { |
| 153 | if (TII->AnalyzeBranch(*PredMBB, FtTBB, FtFBB, FtCond)) { |
| 154 | OkToMove = false; |
| 155 | break; |
| 156 | } |
| 157 | if (!FtTBB) |
| 158 | FtTBB = SuccMBB; |
| 159 | else if (!FtFBB) { |
| 160 | assert(FtFBB != SuccMBB && "Unexpected control flow!"); |
| 161 | FtFBB = SuccMBB; |
| 162 | } |
| 163 | |
| 164 | // A fallthrough. |
| 165 | FtMBB = PredMBB; |
| 166 | MachineLoop *PL = MLI->getLoopFor(PredMBB); |
| 167 | if (PL && (PL == L || PL->getLoopDepth() >= L->getLoopDepth())) { |
| 168 | OkToMove = false; |
| 169 | break; |
| 170 | } |
| 171 | } |
| 172 | } |
| 173 | |
| 174 | if (!OkToMove) |
| 175 | continue; |
| 176 | |
| 177 | // Is it profitable? If SuccMBB can fallthrough itself, that can be changed |
| 178 | // into a jmp. |
| 179 | MachineBasicBlock *TBB = 0, *FBB = 0; |
| 180 | SmallVector<MachineOperand, 4> Cond; |
| 181 | if (TII->AnalyzeBranch(*SuccMBB, TBB, FBB, Cond)) |
| 182 | continue; |
| 183 | if (!TBB && Cond.empty()) |
| 184 | TBB = next(MachineFunction::iterator(SuccMBB)); |
| 185 | else if (!FBB && !Cond.empty()) |
| 186 | FBB = next(MachineFunction::iterator(SuccMBB)); |
| 187 | |
| 188 | // This calculate the cost of the transformation. Also, it finds the *only* |
| 189 | // intra-loop edge if there is one. |
| 190 | int Cost = 0; |
| 191 | bool HasOneIntraSucc = true; |
| 192 | MachineBasicBlock *IntraSucc = 0; |
| 193 | for (MachineBasicBlock::succ_iterator SI = SuccMBB->succ_begin(), |
| 194 | SE = SuccMBB->succ_end(); SI != SE; ++SI) { |
| 195 | MachineBasicBlock *SSMBB = *SI; |
| 196 | if (MLI->getLoopFor(SSMBB) == L) { |
| 197 | if (!IntraSucc) |
| 198 | IntraSucc = SSMBB; |
| 199 | else |
| 200 | HasOneIntraSucc = false; |
| 201 | } |
| 202 | |
| 203 | if (SuccMBB->isLayoutSuccessor(SSMBB)) |
| 204 | // This will become a jmp. |
| 205 | ++Cost; |
Nick Lewycky | 0ab2dce | 2009-05-08 06:57:41 +0000 | [diff] [blame] | 206 | else if (MBB->isLayoutSuccessor(SSMBB)) { |
Evan Cheng | 45e0010 | 2009-05-08 06:34:09 +0000 | [diff] [blame] | 207 | // One of the successor will become the new fallthrough. |
| 208 | if (SSMBB == FBB) { |
| 209 | FBB = 0; |
| 210 | --Cost; |
| 211 | } else if (!FBB && SSMBB == TBB && Cond.empty()) { |
| 212 | TBB = 0; |
| 213 | --Cost; |
Evan Cheng | 4b7f7a6 | 2009-05-08 09:35:53 +0000 | [diff] [blame^] | 214 | } else if (!Cond.empty() && !TII->ReverseBranchCondition(Cond)) { |
| 215 | assert(SSMBB == TBB); |
Evan Cheng | 45e0010 | 2009-05-08 06:34:09 +0000 | [diff] [blame] | 216 | TBB = FBB; |
| 217 | FBB = 0; |
| 218 | --Cost; |
| 219 | } |
Nick Lewycky | 0ab2dce | 2009-05-08 06:57:41 +0000 | [diff] [blame] | 220 | } |
Evan Cheng | 45e0010 | 2009-05-08 06:34:09 +0000 | [diff] [blame] | 221 | } |
| 222 | if (Cost) |
| 223 | continue; |
| 224 | |
| 225 | // Now, let's move the successor to below the BB to eliminate the jmp. |
| 226 | SuccMBB->moveAfter(MBB); |
| 227 | TII->RemoveBranch(*MBB); |
| 228 | TII->RemoveBranch(*SuccMBB); |
| 229 | if (TBB) |
| 230 | TII->InsertBranch(*SuccMBB, TBB, FBB, Cond); |
| 231 | ChangedMBBs.insert(MBB); |
| 232 | ChangedMBBs.insert(SuccMBB); |
| 233 | if (FtMBB) { |
| 234 | TII->RemoveBranch(*FtMBB); |
| 235 | TII->InsertBranch(*FtMBB, FtTBB, FtFBB, FtCond); |
| 236 | ChangedMBBs.insert(FtMBB); |
| 237 | } |
| 238 | |
| 239 | // If BB is the loop latch, we may have a new loop headr. |
| 240 | if (MBB == L->getLoopLatch()) { |
| 241 | assert(MLI->isLoopHeader(SuccMBB) && |
| 242 | "Only succ of loop latch is not the header?"); |
| 243 | if (HasOneIntraSucc && IntraSucc) |
| 244 | std::replace(LoopHeaders.begin(),LoopHeaders.end(), SuccMBB, IntraSucc); |
| 245 | } |
| 246 | } |
| 247 | |
| 248 | ++NumIntraMoved; |
| 249 | return Changed; |
| 250 | } |
| 251 | |
Evan Cheng | 7132e12 | 2009-05-07 05:49:39 +0000 | [diff] [blame] | 252 | /// AlignLoops - Align loop headers to target preferred alignments. |
| 253 | /// |
| 254 | bool CodePlacementOpt::AlignLoops(MachineFunction &MF) { |
Evan Cheng | 45e0010 | 2009-05-08 06:34:09 +0000 | [diff] [blame] | 255 | const Function *F = MF.getFunction(); |
| 256 | if (F->hasFnAttr(Attribute::OptimizeForSize)) |
Evan Cheng | 4f658e9 | 2008-02-29 17:52:15 +0000 | [diff] [blame] | 257 | return false; |
| 258 | |
| 259 | unsigned Align = TLI->getPrefLoopAlignment(); |
Evan Cheng | fb8075d | 2008-02-28 00:43:03 +0000 | [diff] [blame] | 260 | if (!Align) |
| 261 | return false; // Don't care about loop alignment. |
| 262 | |
Evan Cheng | 45e0010 | 2009-05-08 06:34:09 +0000 | [diff] [blame] | 263 | // Make sure blocks are numbered in order |
| 264 | MF.RenumberBlocks(); |
Devang Patel | 4ae641f | 2008-10-01 23:18:38 +0000 | [diff] [blame] | 265 | |
Evan Cheng | 7132e12 | 2009-05-07 05:49:39 +0000 | [diff] [blame] | 266 | bool Changed = false; |
Evan Cheng | 45e0010 | 2009-05-08 06:34:09 +0000 | [diff] [blame] | 267 | for (unsigned i = 0, e = LoopHeaders.size(); i != e; ++i) { |
| 268 | MachineBasicBlock *HeaderMBB = LoopHeaders[i]; |
| 269 | MachineBasicBlock *PredMBB = prior(MachineFunction::iterator(HeaderMBB)); |
| 270 | if (MLI->getLoopFor(HeaderMBB) != MLI->getLoopFor(PredMBB)) { |
| 271 | // If previously BB is in the same loop, don't align this BB. We want |
| 272 | // to prevent adding noop's inside a loop. |
| 273 | HeaderMBB->setAlignment(Align); |
Evan Cheng | 7132e12 | 2009-05-07 05:49:39 +0000 | [diff] [blame] | 274 | Changed = true; |
Evan Cheng | 45e0010 | 2009-05-08 06:34:09 +0000 | [diff] [blame] | 275 | ++NumHeaderAligned; |
Evan Cheng | df90841 | 2008-11-27 01:16:00 +0000 | [diff] [blame] | 276 | } |
Evan Cheng | fb8075d | 2008-02-28 00:43:03 +0000 | [diff] [blame] | 277 | } |
| 278 | |
Evan Cheng | 7132e12 | 2009-05-07 05:49:39 +0000 | [diff] [blame] | 279 | return Changed; |
| 280 | } |
| 281 | |
| 282 | bool CodePlacementOpt::runOnMachineFunction(MachineFunction &MF) { |
| 283 | MLI = &getAnalysis<MachineLoopInfo>(); |
| 284 | if (MLI->empty()) |
| 285 | return false; // No loops. |
| 286 | |
Evan Cheng | 45e0010 | 2009-05-08 06:34:09 +0000 | [diff] [blame] | 287 | TLI = MF.getTarget().getTargetLowering(); |
| 288 | TII = MF.getTarget().getInstrInfo(); |
| 289 | |
| 290 | // Analyze the BBs first and keep track of loop headers and BBs that |
| 291 | // end with an unconditional jmp to another block in the same loop. |
| 292 | for (MachineFunction::iterator I = MF.begin(), E = MF.end(); I != E; ++I) { |
| 293 | MachineBasicBlock *MBB = I; |
| 294 | if (MBB->isLandingPad()) |
| 295 | continue; |
| 296 | MachineLoop *L = MLI->getLoopFor(MBB); |
| 297 | if (!L) |
| 298 | continue; |
| 299 | if (MLI->isLoopHeader(MBB)) |
| 300 | LoopHeaders.push_back(MBB); |
| 301 | |
| 302 | MachineBasicBlock *TBB = 0, *FBB = 0; |
| 303 | SmallVector<MachineOperand, 4> Cond; |
| 304 | if (TII->AnalyzeBranch(*MBB, TBB, FBB, Cond) || !Cond.empty()) |
| 305 | continue; |
| 306 | if (MLI->getLoopFor(TBB) == L && !TBB->isLandingPad()) |
| 307 | UncondJmpMBBs.push_back(std::make_pair(MBB, TBB)); |
| 308 | } |
| 309 | |
| 310 | bool Changed = OptimizeIntraLoopEdges(); |
| 311 | |
Evan Cheng | 7132e12 | 2009-05-07 05:49:39 +0000 | [diff] [blame] | 312 | Changed |= AlignLoops(MF); |
| 313 | |
Evan Cheng | 45e0010 | 2009-05-08 06:34:09 +0000 | [diff] [blame] | 314 | ChangedMBBs.clear(); |
| 315 | UncondJmpMBBs.clear(); |
| 316 | LoopHeaders.clear(); |
| 317 | |
Evan Cheng | 7132e12 | 2009-05-07 05:49:39 +0000 | [diff] [blame] | 318 | return Changed; |
Evan Cheng | fb8075d | 2008-02-28 00:43:03 +0000 | [diff] [blame] | 319 | } |