blob: 99233dfc2e3c08aacdcef2876a94d5baca441133 [file] [log] [blame]
Evan Chengbbf1db72009-05-07 05:42:24 +00001//===-- CodePlacementOpt.cpp - Code Placement pass. -----------------------===//
Evan Chengfb8075d2008-02-28 00:43:03 +00002//
3// The LLVM Compiler Infrastructure
4//
5// This file is distributed under the University of Illinois Open Source
6// License. See LICENSE.TXT for details.
7//
8//===----------------------------------------------------------------------===//
9//
Cameron Zwarichf7af3962011-03-02 04:03:46 +000010// This file implements the pass that optimizes code placement and aligns loop
11// headers to target-specific alignment boundaries.
Evan Chengfb8075d2008-02-28 00:43:03 +000012//
13//===----------------------------------------------------------------------===//
14
Evan Chengbbf1db72009-05-07 05:42:24 +000015#define DEBUG_TYPE "code-placement"
Evan Chengfb8075d2008-02-28 00:43:03 +000016#include "llvm/CodeGen/MachineLoopInfo.h"
17#include "llvm/CodeGen/MachineFunctionPass.h"
18#include "llvm/CodeGen/Passes.h"
Evan Cheng45e00102009-05-08 06:34:09 +000019#include "llvm/Target/TargetInstrInfo.h"
Evan Chengfb8075d2008-02-28 00:43:03 +000020#include "llvm/Target/TargetLowering.h"
21#include "llvm/Target/TargetMachine.h"
Evan Chengfb8075d2008-02-28 00:43:03 +000022#include "llvm/Support/Compiler.h"
23#include "llvm/Support/Debug.h"
Evan Cheng45e00102009-05-08 06:34:09 +000024#include "llvm/ADT/Statistic.h"
Evan Chengfb8075d2008-02-28 00:43:03 +000025using namespace llvm;
26
Dan Gohmancd2ae142009-10-15 00:36:22 +000027STATISTIC(NumLoopsAligned, "Number of loops aligned");
Evan Cheng45e00102009-05-08 06:34:09 +000028STATISTIC(NumIntraElim, "Number of intra loop branches eliminated");
29STATISTIC(NumIntraMoved, "Number of intra loop branches moved");
30
Evan Chengfb8075d2008-02-28 00:43:03 +000031namespace {
Evan Chengbbf1db72009-05-07 05:42:24 +000032 class CodePlacementOpt : public MachineFunctionPass {
Evan Cheng7132e122009-05-07 05:49:39 +000033 const MachineLoopInfo *MLI;
Evan Cheng45e00102009-05-08 06:34:09 +000034 const TargetInstrInfo *TII;
35 const TargetLowering *TLI;
36
Evan Chengfb8075d2008-02-28 00:43:03 +000037 public:
38 static char ID;
Owen Anderson90c579d2010-08-06 18:33:48 +000039 CodePlacementOpt() : MachineFunctionPass(ID) {}
Evan Chengfb8075d2008-02-28 00:43:03 +000040
41 virtual bool runOnMachineFunction(MachineFunction &MF);
Evan Chengfb8075d2008-02-28 00:43:03 +000042
43 virtual void getAnalysisUsage(AnalysisUsage &AU) const {
44 AU.addRequired<MachineLoopInfo>();
Evan Cheng8b56a902008-09-22 22:21:38 +000045 AU.addPreservedID(MachineDominatorsID);
Evan Chengfb8075d2008-02-28 00:43:03 +000046 MachineFunctionPass::getAnalysisUsage(AU);
47 }
Evan Cheng7132e122009-05-07 05:49:39 +000048
49 private:
Dan Gohman07adb852009-10-20 04:50:37 +000050 bool HasFallthrough(MachineBasicBlock *MBB);
51 bool HasAnalyzableTerminator(MachineBasicBlock *MBB);
52 void Splice(MachineFunction &MF,
53 MachineFunction::iterator InsertPt,
54 MachineFunction::iterator Begin,
55 MachineFunction::iterator End);
Dan Gohman07adb852009-10-20 04:50:37 +000056 bool EliminateUnconditionalJumpsToTop(MachineFunction &MF,
57 MachineLoop *L);
58 bool MoveDiscontiguousLoopBlocks(MachineFunction &MF,
59 MachineLoop *L);
60 bool OptimizeIntraLoopEdgesInLoopNest(MachineFunction &MF, MachineLoop *L);
61 bool OptimizeIntraLoopEdges(MachineFunction &MF);
Evan Cheng7132e122009-05-07 05:49:39 +000062 bool AlignLoops(MachineFunction &MF);
Dan Gohmancd2ae142009-10-15 00:36:22 +000063 bool AlignLoop(MachineFunction &MF, MachineLoop *L, unsigned Align);
Evan Chengfb8075d2008-02-28 00:43:03 +000064 };
65
Evan Chengbbf1db72009-05-07 05:42:24 +000066 char CodePlacementOpt::ID = 0;
Evan Chengfb8075d2008-02-28 00:43:03 +000067} // end anonymous namespace
68
Andrew Trick1dd8c852012-02-08 21:23:13 +000069char &llvm::CodePlacementOptID = CodePlacementOpt::ID;
70INITIALIZE_PASS(CodePlacementOpt, "code-placement",
71 "Code Placement Optimizer", false, false)
Evan Chengfb8075d2008-02-28 00:43:03 +000072
Dan Gohman07adb852009-10-20 04:50:37 +000073/// HasFallthrough - Test whether the given branch has a fallthrough, either as
74/// a plain fallthrough or as a fallthrough case of a conditional branch.
Evan Cheng45e00102009-05-08 06:34:09 +000075///
Dan Gohman07adb852009-10-20 04:50:37 +000076bool CodePlacementOpt::HasFallthrough(MachineBasicBlock *MBB) {
77 MachineBasicBlock *TBB = 0, *FBB = 0;
78 SmallVector<MachineOperand, 4> Cond;
79 if (TII->AnalyzeBranch(*MBB, TBB, FBB, Cond))
80 return false;
81 // This conditional branch has no fallthrough.
82 if (FBB)
83 return false;
84 // An unconditional branch has no fallthrough.
85 if (Cond.empty() && TBB)
86 return false;
87 // It has a fallthrough.
88 return true;
89}
90
91/// HasAnalyzableTerminator - Test whether AnalyzeBranch will succeed on MBB.
92/// This is called before major changes are begun to test whether it will be
93/// possible to complete the changes.
Evan Cheng45e00102009-05-08 06:34:09 +000094///
Dan Gohman07adb852009-10-20 04:50:37 +000095/// Target-specific code is hereby encouraged to make AnalyzeBranch succeed
96/// whenever possible.
Evan Cheng45e00102009-05-08 06:34:09 +000097///
Dan Gohman07adb852009-10-20 04:50:37 +000098bool CodePlacementOpt::HasAnalyzableTerminator(MachineBasicBlock *MBB) {
99 // Conservatively ignore EH landing pads.
100 if (MBB->isLandingPad()) return false;
101
Dan Gohman07adb852009-10-20 04:50:37 +0000102 // Aggressively handle return blocks and similar constructs.
103 if (MBB->succ_empty()) return true;
Dan Gohman3bdd8de2009-10-17 00:32:43 +0000104
Dan Gohman07adb852009-10-20 04:50:37 +0000105 // Ask the target's AnalyzeBranch if it can handle this block.
106 MachineBasicBlock *TBB = 0, *FBB = 0;
107 SmallVector<MachineOperand, 4> Cond;
Dan Gohmanf3b11aa2010-02-10 20:04:19 +0000108 // Make sure the terminator is understood.
Dan Gohman07adb852009-10-20 04:50:37 +0000109 if (TII->AnalyzeBranch(*MBB, TBB, FBB, Cond))
110 return false;
Dan Gohman49d7f8d2010-02-18 21:25:53 +0000111 // Ignore blocks which look like they might have EH-related control flow.
112 // AnalyzeBranch thinks it knows how to analyze such things, but it doesn't
113 // recognize the possibility of a control transfer through an unwind.
114 // Such blocks contain EH_LABEL instructions, however they may be in the
115 // middle of the block. Instead of searching for them, just check to see
116 // if the CFG disagrees with AnalyzeBranch.
117 if (1u + !Cond.empty() != MBB->succ_size())
118 return false;
Dan Gohman07adb852009-10-20 04:50:37 +0000119 // Make sure we have the option of reversing the condition.
120 if (!Cond.empty() && TII->ReverseBranchCondition(Cond))
121 return false;
122 return true;
123}
124
125/// Splice - Move the sequence of instructions [Begin,End) to just before
126/// InsertPt. Update branch instructions as needed to account for broken
127/// fallthrough edges and to take advantage of newly exposed fallthrough
128/// opportunities.
129///
130void CodePlacementOpt::Splice(MachineFunction &MF,
131 MachineFunction::iterator InsertPt,
132 MachineFunction::iterator Begin,
133 MachineFunction::iterator End) {
134 assert(Begin != MF.begin() && End != MF.begin() && InsertPt != MF.begin() &&
135 "Splice can't change the entry block!");
136 MachineFunction::iterator OldBeginPrior = prior(Begin);
137 MachineFunction::iterator OldEndPrior = prior(End);
138
139 MF.splice(InsertPt, Begin, End);
140
Jim Grosbach7707a0d2009-11-12 03:55:33 +0000141 prior(Begin)->updateTerminator();
142 OldBeginPrior->updateTerminator();
143 OldEndPrior->updateTerminator();
Dan Gohman07adb852009-10-20 04:50:37 +0000144}
Evan Cheng45e00102009-05-08 06:34:09 +0000145
Dan Gohman07adb852009-10-20 04:50:37 +0000146/// EliminateUnconditionalJumpsToTop - Move blocks which unconditionally jump
147/// to the loop top to the top of the loop so that they have a fall through.
148/// This can introduce a branch on entry to the loop, but it can eliminate a
149/// branch within the loop. See the @simple case in
150/// test/CodeGen/X86/loop_blocks.ll for an example of this.
151bool CodePlacementOpt::EliminateUnconditionalJumpsToTop(MachineFunction &MF,
152 MachineLoop *L) {
153 bool Changed = false;
154 MachineBasicBlock *TopMBB = L->getTopBlock();
155
156 bool BotHasFallthrough = HasFallthrough(L->getBottomBlock());
157
158 if (TopMBB == MF.begin() ||
159 HasAnalyzableTerminator(prior(MachineFunction::iterator(TopMBB)))) {
160 new_top:
161 for (MachineBasicBlock::pred_iterator PI = TopMBB->pred_begin(),
162 PE = TopMBB->pred_end(); PI != PE; ++PI) {
163 MachineBasicBlock *Pred = *PI;
164 if (Pred == TopMBB) continue;
165 if (HasFallthrough(Pred)) continue;
166 if (!L->contains(Pred)) continue;
167
168 // Verify that we can analyze all the loop entry edges before beginning
169 // any changes which will require us to be able to analyze them.
170 if (Pred == MF.begin())
171 continue;
172 if (!HasAnalyzableTerminator(Pred))
173 continue;
174 if (!HasAnalyzableTerminator(prior(MachineFunction::iterator(Pred))))
175 continue;
176
177 // Move the block.
Dan Gohmanba1fe142010-06-07 22:32:10 +0000178 DEBUG(dbgs() << "CGP: Moving blocks starting at BB#" << Pred->getNumber()
179 << " to top of loop.\n");
Dan Gohman3bdd8de2009-10-17 00:32:43 +0000180 Changed = true;
Dan Gohman3bdd8de2009-10-17 00:32:43 +0000181
Dan Gohman07adb852009-10-20 04:50:37 +0000182 // Move it and all the blocks that can reach it via fallthrough edges
183 // exclusively, to keep existing fallthrough edges intact.
184 MachineFunction::iterator Begin = Pred;
Chris Lattner7896c9f2009-12-03 00:50:42 +0000185 MachineFunction::iterator End = llvm::next(Begin);
Dan Gohman07adb852009-10-20 04:50:37 +0000186 while (Begin != MF.begin()) {
187 MachineFunction::iterator Prior = prior(Begin);
188 if (Prior == MF.begin())
189 break;
190 // Stop when a non-fallthrough edge is found.
191 if (!HasFallthrough(Prior))
192 break;
193 // Stop if a block which could fall-through out of the loop is found.
194 if (Prior->isSuccessor(End))
195 break;
196 // If we've reached the top, stop scanning.
197 if (Prior == MachineFunction::iterator(TopMBB)) {
198 // We know top currently has a fall through (because we just checked
199 // it) which would be lost if we do the transformation, so it isn't
200 // worthwhile to do the transformation unless it would expose a new
201 // fallthrough edge.
202 if (!Prior->isSuccessor(End))
203 goto next_pred;
Benjamin Kramerd9b0b022012-06-02 10:20:22 +0000204 // Otherwise we can stop scanning and proceed to move the blocks.
Dan Gohman3bdd8de2009-10-17 00:32:43 +0000205 break;
206 }
Dan Gohman07adb852009-10-20 04:50:37 +0000207 // If we hit a switch or something complicated, don't move anything
208 // for this predecessor.
209 if (!HasAnalyzableTerminator(prior(MachineFunction::iterator(Prior))))
210 break;
211 // Ok, the block prior to Begin will be moved along with the rest.
212 // Extend the range to include it.
213 Begin = Prior;
214 ++NumIntraMoved;
Anton Korobeynikov766fc1d2009-10-19 18:21:09 +0000215 }
216
Dan Gohman07adb852009-10-20 04:50:37 +0000217 // Move the blocks.
218 Splice(MF, TopMBB, Begin, End);
Anton Korobeynikov766fc1d2009-10-19 18:21:09 +0000219
Dan Gohman07adb852009-10-20 04:50:37 +0000220 // Update TopMBB.
221 TopMBB = L->getTopBlock();
222
223 // We have a new loop top. Iterate on it. We shouldn't have to do this
224 // too many times if BranchFolding has done a reasonable job.
225 goto new_top;
226 next_pred:;
Anton Korobeynikov766fc1d2009-10-19 18:21:09 +0000227 }
Anton Korobeynikov766fc1d2009-10-19 18:21:09 +0000228 }
229
Dan Gohman07adb852009-10-20 04:50:37 +0000230 // If the loop previously didn't exit with a fall-through and it now does,
231 // we eliminated a branch.
232 if (Changed &&
233 !BotHasFallthrough &&
234 HasFallthrough(L->getBottomBlock())) {
235 ++NumIntraElim;
Dan Gohman07adb852009-10-20 04:50:37 +0000236 }
237
238 return Changed;
239}
240
241/// MoveDiscontiguousLoopBlocks - Move any loop blocks that are not in the
242/// portion of the loop contiguous with the header. This usually makes the loop
243/// contiguous, provided that AnalyzeBranch can handle all the relevant
244/// branching. See the @cfg_islands case in test/CodeGen/X86/loop_blocks.ll
245/// for an example of this.
246bool CodePlacementOpt::MoveDiscontiguousLoopBlocks(MachineFunction &MF,
247 MachineLoop *L) {
248 bool Changed = false;
249 MachineBasicBlock *TopMBB = L->getTopBlock();
250 MachineBasicBlock *BotMBB = L->getBottomBlock();
251
252 // Determine a position to move orphaned loop blocks to. If TopMBB is not
253 // entered via fallthrough and BotMBB is exited via fallthrough, prepend them
Chris Lattner7a2bdde2011-04-15 05:18:47 +0000254 // to the top of the loop to avoid losing that fallthrough. Otherwise append
Dan Gohman07adb852009-10-20 04:50:37 +0000255 // them to the bottom, even if it previously had a fallthrough, on the theory
256 // that it's worth an extra branch to keep the loop contiguous.
Chris Lattner7896c9f2009-12-03 00:50:42 +0000257 MachineFunction::iterator InsertPt =
258 llvm::next(MachineFunction::iterator(BotMBB));
Dan Gohman07adb852009-10-20 04:50:37 +0000259 bool InsertAtTop = false;
260 if (TopMBB != MF.begin() &&
261 !HasFallthrough(prior(MachineFunction::iterator(TopMBB))) &&
262 HasFallthrough(BotMBB)) {
263 InsertPt = TopMBB;
264 InsertAtTop = true;
265 }
266
267 // Keep a record of which blocks are in the portion of the loop contiguous
268 // with the loop header.
269 SmallPtrSet<MachineBasicBlock *, 8> ContiguousBlocks;
270 for (MachineFunction::iterator I = TopMBB,
Chris Lattner7896c9f2009-12-03 00:50:42 +0000271 E = llvm::next(MachineFunction::iterator(BotMBB)); I != E; ++I)
Dan Gohman07adb852009-10-20 04:50:37 +0000272 ContiguousBlocks.insert(I);
273
274 // Find non-contigous blocks and fix them.
275 if (InsertPt != MF.begin() && HasAnalyzableTerminator(prior(InsertPt)))
276 for (MachineLoop::block_iterator BI = L->block_begin(), BE = L->block_end();
277 BI != BE; ++BI) {
278 MachineBasicBlock *BB = *BI;
279
280 // Verify that we can analyze all the loop entry edges before beginning
281 // any changes which will require us to be able to analyze them.
282 if (!HasAnalyzableTerminator(BB))
283 continue;
284 if (!HasAnalyzableTerminator(prior(MachineFunction::iterator(BB))))
285 continue;
286
287 // If the layout predecessor is part of the loop, this block will be
288 // processed along with it. This keeps them in their relative order.
289 if (BB != MF.begin() &&
290 L->contains(prior(MachineFunction::iterator(BB))))
291 continue;
292
293 // Check to see if this block is already contiguous with the main
294 // portion of the loop.
295 if (!ContiguousBlocks.insert(BB))
296 continue;
297
298 // Move the block.
Dan Gohmanba1fe142010-06-07 22:32:10 +0000299 DEBUG(dbgs() << "CGP: Moving blocks starting at BB#" << BB->getNumber()
300 << " to be contiguous with loop.\n");
Dan Gohman07adb852009-10-20 04:50:37 +0000301 Changed = true;
302
303 // Process this block and all loop blocks contiguous with it, to keep
304 // them in their relative order.
305 MachineFunction::iterator Begin = BB;
Chris Lattner7896c9f2009-12-03 00:50:42 +0000306 MachineFunction::iterator End = llvm::next(MachineFunction::iterator(BB));
Dan Gohman07adb852009-10-20 04:50:37 +0000307 for (; End != MF.end(); ++End) {
308 if (!L->contains(End)) break;
309 if (!HasAnalyzableTerminator(End)) break;
310 ContiguousBlocks.insert(End);
311 ++NumIntraMoved;
312 }
313
314 // If we're inserting at the bottom of the loop, and the code we're
315 // moving originally had fall-through successors, bring the sucessors
316 // up with the loop blocks to preserve the fall-through edges.
317 if (!InsertAtTop)
318 for (; End != MF.end(); ++End) {
319 if (L->contains(End)) break;
320 if (!HasAnalyzableTerminator(End)) break;
321 if (!HasFallthrough(prior(End))) break;
322 }
323
324 // Move the blocks. This may invalidate TopMBB and/or BotMBB, but
325 // we don't need them anymore at this point.
326 Splice(MF, InsertPt, Begin, End);
327 }
328
329 return Changed;
330}
331
332/// OptimizeIntraLoopEdgesInLoopNest - Reposition loop blocks to minimize
333/// intra-loop branching and to form contiguous loops.
334///
335/// This code takes the approach of making minor changes to the existing
336/// layout to fix specific loop-oriented problems. Also, it depends on
337/// AnalyzeBranch, which can't understand complex control instructions.
338///
339bool CodePlacementOpt::OptimizeIntraLoopEdgesInLoopNest(MachineFunction &MF,
340 MachineLoop *L) {
341 bool Changed = false;
342
343 // Do optimization for nested loops.
344 for (MachineLoop::iterator I = L->begin(), E = L->end(); I != E; ++I)
345 Changed |= OptimizeIntraLoopEdgesInLoopNest(MF, *I);
346
347 // Do optimization for this loop.
348 Changed |= EliminateUnconditionalJumpsToTop(MF, L);
349 Changed |= MoveDiscontiguousLoopBlocks(MF, L);
350
351 return Changed;
352}
353
354/// OptimizeIntraLoopEdges - Reposition loop blocks to minimize
355/// intra-loop branching and to form contiguous loops.
356///
357bool CodePlacementOpt::OptimizeIntraLoopEdges(MachineFunction &MF) {
358 bool Changed = false;
359
360 if (!TLI->shouldOptimizeCodePlacement())
361 return Changed;
362
363 // Do optimization for each loop in the function.
364 for (MachineLoopInfo::iterator I = MLI->begin(), E = MLI->end();
365 I != E; ++I)
366 if (!(*I)->getParentLoop())
367 Changed |= OptimizeIntraLoopEdgesInLoopNest(MF, *I);
368
Evan Cheng45e00102009-05-08 06:34:09 +0000369 return Changed;
370}
371
Evan Cheng7132e122009-05-07 05:49:39 +0000372/// AlignLoops - Align loop headers to target preferred alignments.
373///
374bool CodePlacementOpt::AlignLoops(MachineFunction &MF) {
Evan Cheng45e00102009-05-08 06:34:09 +0000375 const Function *F = MF.getFunction();
376 if (F->hasFnAttr(Attribute::OptimizeForSize))
Evan Cheng4f658e92008-02-29 17:52:15 +0000377 return false;
378
379 unsigned Align = TLI->getPrefLoopAlignment();
Evan Chengfb8075d2008-02-28 00:43:03 +0000380 if (!Align)
381 return false; // Don't care about loop alignment.
382
Evan Cheng7132e122009-05-07 05:49:39 +0000383 bool Changed = false;
Dan Gohmancd2ae142009-10-15 00:36:22 +0000384
385 for (MachineLoopInfo::iterator I = MLI->begin(), E = MLI->end();
386 I != E; ++I)
387 Changed |= AlignLoop(MF, *I, Align);
388
389 return Changed;
390}
391
Dan Gohman07adb852009-10-20 04:50:37 +0000392/// AlignLoop - Align loop headers to target preferred alignments.
393///
Dan Gohmancd2ae142009-10-15 00:36:22 +0000394bool CodePlacementOpt::AlignLoop(MachineFunction &MF, MachineLoop *L,
395 unsigned Align) {
396 bool Changed = false;
397
398 // Do alignment for nested loops.
399 for (MachineLoop::iterator I = L->begin(), E = L->end(); I != E; ++I)
400 Changed |= AlignLoop(MF, *I, Align);
401
Dan Gohman07adb852009-10-20 04:50:37 +0000402 L->getTopBlock()->setAlignment(Align);
Dan Gohmancd2ae142009-10-15 00:36:22 +0000403 Changed = true;
404 ++NumLoopsAligned;
405
Evan Cheng7132e122009-05-07 05:49:39 +0000406 return Changed;
407}
408
409bool CodePlacementOpt::runOnMachineFunction(MachineFunction &MF) {
410 MLI = &getAnalysis<MachineLoopInfo>();
411 if (MLI->empty())
412 return false; // No loops.
413
Evan Cheng45e00102009-05-08 06:34:09 +0000414 TLI = MF.getTarget().getTargetLowering();
415 TII = MF.getTarget().getInstrInfo();
416
Dan Gohman07adb852009-10-20 04:50:37 +0000417 bool Changed = OptimizeIntraLoopEdges(MF);
Evan Cheng45e00102009-05-08 06:34:09 +0000418
Evan Cheng7132e122009-05-07 05:49:39 +0000419 Changed |= AlignLoops(MF);
420
421 return Changed;
Evan Chengfb8075d2008-02-28 00:43:03 +0000422}