blob: 38013476188d8835c8d9d365475bcec77dbca2c8 [file] [log] [blame]
Tom Stellard6b7d99d2012-12-19 22:10:31 +00001//===-- AMDGPUStructurizeCFG.cpp - ------------------===//
2//
3// The LLVM Compiler Infrastructure
4//
5// This file is distributed under the University of Illinois Open Source
6// License. See LICENSE.TXT for details.
7//
8//===----------------------------------------------------------------------===//
9//
10/// \file
11/// The pass implemented in this file transforms the programs control flow
12/// graph into a form that's suitable for code generation on hardware that
13/// implements control flow by execution masking. This currently includes all
14/// AMD GPUs but may as well be useful for other types of hardware.
15//
16//===----------------------------------------------------------------------===//
17
18#include "AMDGPU.h"
Tom Stellard6b7d99d2012-12-19 22:10:31 +000019#include "llvm/ADT/SCCIterator.h"
Tom Stellard6b7d99d2012-12-19 22:10:31 +000020#include "llvm/Analysis/RegionInfo.h"
Chandler Carruth58a2cbe2013-01-02 10:22:59 +000021#include "llvm/Analysis/RegionIterator.h"
Tom Stellard6b7d99d2012-12-19 22:10:31 +000022#include "llvm/Analysis/RegionPass.h"
Chandler Carruth0b8c9a82013-01-02 11:36:10 +000023#include "llvm/IR/Module.h"
Tom Stellard6b7d99d2012-12-19 22:10:31 +000024#include "llvm/Transforms/Utils/SSAUpdater.h"
25
26using namespace llvm;
27
28namespace {
29
30// Definition of the complex types used in this pass.
31
32typedef std::pair<BasicBlock *, Value *> BBValuePair;
Tom Stellard6b7d99d2012-12-19 22:10:31 +000033
34typedef SmallVector<RegionNode*, 8> RNVector;
35typedef SmallVector<BasicBlock*, 8> BBVector;
Tom Stellard27f5d062013-02-08 22:24:37 +000036typedef SmallVector<BranchInst*, 8> BranchVector;
Tom Stellard6b7d99d2012-12-19 22:10:31 +000037typedef SmallVector<BBValuePair, 2> BBValueVector;
38
Tom Stellard27f5d062013-02-08 22:24:37 +000039typedef SmallPtrSet<BasicBlock *, 8> BBSet;
40
Tom Stellard6b7d99d2012-12-19 22:10:31 +000041typedef DenseMap<PHINode *, BBValueVector> PhiMap;
Christian Konigf0e469b2013-02-16 11:27:29 +000042typedef DenseMap<DomTreeNode *, unsigned> DTN2UnsignedMap;
Tom Stellard6b7d99d2012-12-19 22:10:31 +000043typedef DenseMap<BasicBlock *, PhiMap> BBPhiMap;
44typedef DenseMap<BasicBlock *, Value *> BBPredicates;
45typedef DenseMap<BasicBlock *, BBPredicates> PredMap;
Tom Stellard13cf6cb2013-02-08 22:24:35 +000046typedef DenseMap<BasicBlock *, BBVector> BB2BBVecMap;
Tom Stellard6b7d99d2012-12-19 22:10:31 +000047
48// The name for newly created blocks.
49
50static const char *FlowBlockName = "Flow";
51
Christian Konigf0e469b2013-02-16 11:27:29 +000052/// @brief Find the nearest common dominator for multiple BasicBlocks
53///
54/// Helper class for AMDGPUStructurizeCFG
55/// TODO: Maybe move into common code
56class NearestCommonDominator {
57
58 DominatorTree *DT;
59
60 DTN2UnsignedMap IndexMap;
61
62 BasicBlock *Result;
63 unsigned ResultIndex;
64 bool ExplicitMentioned;
65
66public:
67 /// \brief Start a new query
68 NearestCommonDominator(DominatorTree *DomTree) {
69 DT = DomTree;
70 Result = 0;
71 }
72
73 /// \brief Add BB to the resulting dominator
74 void addBlock(BasicBlock *BB, bool Remember = true) {
75
76 DomTreeNode *Node = DT->getNode(BB);
77
78 if (Result == 0) {
79 unsigned Numbering = 0;
80 for (;Node;Node = Node->getIDom())
81 IndexMap[Node] = ++Numbering;
82 Result = BB;
83 ResultIndex = 1;
84 ExplicitMentioned = Remember;
85 return;
86 }
87
88 for (;Node;Node = Node->getIDom())
89 if (IndexMap.count(Node))
90 break;
91 else
92 IndexMap[Node] = 0;
93
94 assert(Node && "Dominator tree invalid!");
95
96 unsigned Numbering = IndexMap[Node];
97 if (Numbering > ResultIndex) {
98 Result = Node->getBlock();
99 ResultIndex = Numbering;
100 ExplicitMentioned = Remember && (Result == BB);
101 } else if (Numbering == ResultIndex) {
102 ExplicitMentioned |= Remember;
103 }
104 }
105
106 /// \brief Is "Result" one of the BBs added with "Remember" = True?
107 bool wasResultExplicitMentioned() {
108 return ExplicitMentioned;
109 }
110
111 /// \brief Get the query result
112 BasicBlock *getResult() {
113 return Result;
114 }
115};
116
Tom Stellard6b7d99d2012-12-19 22:10:31 +0000117/// @brief Transforms the control flow graph on one single entry/exit region
118/// at a time.
119///
120/// After the transform all "If"/"Then"/"Else" style control flow looks like
121/// this:
122///
123/// \verbatim
124/// 1
125/// ||
126/// | |
127/// 2 |
128/// | /
129/// |/
130/// 3
131/// || Where:
132/// | | 1 = "If" block, calculates the condition
133/// 4 | 2 = "Then" subregion, runs if the condition is true
134/// | / 3 = "Flow" blocks, newly inserted flow blocks, rejoins the flow
135/// |/ 4 = "Else" optional subregion, runs if the condition is false
136/// 5 5 = "End" block, also rejoins the control flow
137/// \endverbatim
138///
139/// Control flow is expressed as a branch where the true exit goes into the
140/// "Then"/"Else" region, while the false exit skips the region
141/// The condition for the optional "Else" region is expressed as a PHI node.
142/// The incomming values of the PHI node are true for the "If" edge and false
143/// for the "Then" edge.
144///
145/// Additionally to that even complicated loops look like this:
146///
147/// \verbatim
148/// 1
149/// ||
150/// | |
151/// 2 ^ Where:
152/// | / 1 = "Entry" block
153/// |/ 2 = "Loop" optional subregion, with all exits at "Flow" block
154/// 3 3 = "Flow" block, with back edge to entry block
155/// |
156/// \endverbatim
157///
158/// The back edge of the "Flow" block is always on the false side of the branch
159/// while the true side continues the general flow. So the loop condition
160/// consist of a network of PHI nodes where the true incoming values expresses
161/// breaks and the false values expresses continue states.
162class AMDGPUStructurizeCFG : public RegionPass {
163
164 static char ID;
165
166 Type *Boolean;
167 ConstantInt *BoolTrue;
168 ConstantInt *BoolFalse;
169 UndefValue *BoolUndef;
170
171 Function *Func;
172 Region *ParentRegion;
173
174 DominatorTree *DT;
175
176 RNVector Order;
Tom Stellardf4e471a2013-02-08 22:24:38 +0000177 BBSet Visited;
Tom Stellard6b7d99d2012-12-19 22:10:31 +0000178 PredMap Predicates;
179 BBPhiMap DeletedPhis;
Tom Stellard13cf6cb2013-02-08 22:24:35 +0000180 BB2BBVecMap AddedPhis;
Tom Stellard27f5d062013-02-08 22:24:37 +0000181 BranchVector Conditions;
Tom Stellard6b7d99d2012-12-19 22:10:31 +0000182
183 BasicBlock *LoopStart;
184 BasicBlock *LoopEnd;
Tom Stellard27f5d062013-02-08 22:24:37 +0000185 BBSet LoopTargets;
Tom Stellard6b7d99d2012-12-19 22:10:31 +0000186 BBPredicates LoopPred;
187
188 void orderNodes();
189
Tom Stellard27f5d062013-02-08 22:24:37 +0000190 Value *buildCondition(BranchInst *Term, unsigned Idx, bool Invert);
Tom Stellard6b7d99d2012-12-19 22:10:31 +0000191
Tom Stellard27f5d062013-02-08 22:24:37 +0000192 bool analyzeLoopStart(BasicBlock *From, BasicBlock *To, Value *Condition);
Tom Stellard6b7d99d2012-12-19 22:10:31 +0000193
Tom Stellard27f5d062013-02-08 22:24:37 +0000194 void analyzeNode(RegionNode *N);
195
196 void analyzeLoopEnd(RegionNode *N);
Tom Stellard6b7d99d2012-12-19 22:10:31 +0000197
198 void collectInfos();
199
Tom Stellard27f5d062013-02-08 22:24:37 +0000200 void insertConditions();
201
Tom Stellard13cf6cb2013-02-08 22:24:35 +0000202 void delPhiValues(BasicBlock *From, BasicBlock *To);
203
204 void addPhiValues(BasicBlock *From, BasicBlock *To);
205
206 void setPhiValues();
207
Tom Stellard6b7d99d2012-12-19 22:10:31 +0000208 void killTerminator(BasicBlock *BB);
209
Tom Stellardf4e471a2013-02-08 22:24:38 +0000210 void changeExit(RegionNode *Node, BasicBlock *NewExit,
211 bool IncludeDominator);
Tom Stellard6b7d99d2012-12-19 22:10:31 +0000212
Tom Stellardf4e471a2013-02-08 22:24:38 +0000213 BasicBlock *getNextFlow(BasicBlock *Dominator);
Tom Stellard6b7d99d2012-12-19 22:10:31 +0000214
Tom Stellardf4e471a2013-02-08 22:24:38 +0000215 BasicBlock *needPrefix(RegionNode *&Prev, RegionNode *Node);
Tom Stellard6b7d99d2012-12-19 22:10:31 +0000216
Tom Stellardf4e471a2013-02-08 22:24:38 +0000217 BasicBlock *needPostfix(BasicBlock *Flow, bool ExitUseAllowed);
218
219 RegionNode *getNextPrev(BasicBlock *Next);
220
221 bool dominatesPredicates(BasicBlock *BB, RegionNode *Node);
222
223 bool isPredictableTrue(RegionNode *Who, RegionNode *Where);
224
225 RegionNode *wireFlow(RegionNode *&Prev, bool ExitUseAllowed);
Tom Stellard6b7d99d2012-12-19 22:10:31 +0000226
227 void createFlow();
228
Tom Stellard6b7d99d2012-12-19 22:10:31 +0000229 void rebuildSSA();
230
231public:
232 AMDGPUStructurizeCFG():
233 RegionPass(ID) {
234
235 initializeRegionInfoPass(*PassRegistry::getPassRegistry());
236 }
237
238 virtual bool doInitialization(Region *R, RGPassManager &RGM);
239
240 virtual bool runOnRegion(Region *R, RGPassManager &RGM);
241
242 virtual const char *getPassName() const {
243 return "AMDGPU simplify control flow";
244 }
245
246 void getAnalysisUsage(AnalysisUsage &AU) const {
247
248 AU.addRequired<DominatorTree>();
249 AU.addPreserved<DominatorTree>();
250 RegionPass::getAnalysisUsage(AU);
251 }
252
253};
254
255} // end anonymous namespace
256
257char AMDGPUStructurizeCFG::ID = 0;
258
259/// \brief Initialize the types and constants used in the pass
260bool AMDGPUStructurizeCFG::doInitialization(Region *R, RGPassManager &RGM) {
Tom Stellard6b7d99d2012-12-19 22:10:31 +0000261 LLVMContext &Context = R->getEntry()->getContext();
262
263 Boolean = Type::getInt1Ty(Context);
264 BoolTrue = ConstantInt::getTrue(Context);
265 BoolFalse = ConstantInt::getFalse(Context);
266 BoolUndef = UndefValue::get(Boolean);
267
268 return false;
269}
270
271/// \brief Build up the general order of nodes
272void AMDGPUStructurizeCFG::orderNodes() {
Tom Stellard6b7d99d2012-12-19 22:10:31 +0000273 scc_iterator<Region *> I = scc_begin(ParentRegion),
274 E = scc_end(ParentRegion);
275 for (Order.clear(); I != E; ++I) {
276 std::vector<RegionNode *> &Nodes = *I;
277 Order.append(Nodes.begin(), Nodes.end());
278 }
279}
280
Tom Stellard27f5d062013-02-08 22:24:37 +0000281/// \brief Build the condition for one edge
282Value *AMDGPUStructurizeCFG::buildCondition(BranchInst *Term, unsigned Idx,
283 bool Invert) {
284 Value *Cond = Invert ? BoolFalse : BoolTrue;
285 if (Term->isConditional()) {
286 Cond = Term->getCondition();
Tom Stellard6b7d99d2012-12-19 22:10:31 +0000287
Tom Stellard27f5d062013-02-08 22:24:37 +0000288 if (Idx != Invert)
289 Cond = BinaryOperator::CreateNot(Cond, "", Term);
290 }
291 return Cond;
292}
293
294/// \brief Analyze the start of a loop and insert predicates as necessary
295bool AMDGPUStructurizeCFG::analyzeLoopStart(BasicBlock *From, BasicBlock *To,
296 Value *Condition) {
297 LoopPred[From] = Condition;
298 LoopTargets.insert(To);
299 if (!LoopStart) {
300 LoopStart = To;
301 return true;
302
303 } else if (LoopStart == To)
304 return true;
305
306 // We need to handle the case of intersecting loops, e. g.
307 //
308 // /----<-----
309 // | |
310 // -> A -> B -> C -> D
311 // | |
312 // -----<----/
313
314 RNVector::reverse_iterator OI = Order.rbegin(), OE = Order.rend();
315
316 for (;OI != OE; ++OI)
317 if ((*OI)->getEntry() == LoopStart)
318 break;
319
320 for (;OI != OE && (*OI)->getEntry() != To; ++OI) {
321 BBPredicates &Pred = Predicates[(*OI)->getEntry()];
322 if (!Pred.count(From))
323 Pred[From] = Condition;
324 }
325 return false;
326}
327
328/// \brief Analyze the predecessors of each block and build up predicates
329void AMDGPUStructurizeCFG::analyzeNode(RegionNode *N) {
Tom Stellard6b7d99d2012-12-19 22:10:31 +0000330 RegionInfo *RI = ParentRegion->getRegionInfo();
Tom Stellard27f5d062013-02-08 22:24:37 +0000331 BasicBlock *BB = N->getEntry();
332 BBPredicates &Pred = Predicates[BB];
Tom Stellard6b7d99d2012-12-19 22:10:31 +0000333
Tom Stellard27f5d062013-02-08 22:24:37 +0000334 for (pred_iterator PI = pred_begin(BB), PE = pred_end(BB);
335 PI != PE; ++PI) {
Tom Stellard6b7d99d2012-12-19 22:10:31 +0000336
Tom Stellard27f5d062013-02-08 22:24:37 +0000337 if (!ParentRegion->contains(*PI)) {
338 // It's a branch from outside into our region entry
339 Pred[*PI] = BoolTrue;
340 continue;
Tom Stellard6b7d99d2012-12-19 22:10:31 +0000341 }
342
Tom Stellard27f5d062013-02-08 22:24:37 +0000343 Region *R = RI->getRegionFor(*PI);
344 if (R == ParentRegion) {
Tom Stellard6b7d99d2012-12-19 22:10:31 +0000345
Tom Stellard27f5d062013-02-08 22:24:37 +0000346 // It's a top level block in our region
347 BranchInst *Term = cast<BranchInst>((*PI)->getTerminator());
348 for (unsigned i = 0, e = Term->getNumSuccessors(); i != e; ++i) {
349 BasicBlock *Succ = Term->getSuccessor(i);
350 if (Succ != BB)
351 continue;
Tom Stellard6b7d99d2012-12-19 22:10:31 +0000352
Tom Stellard27f5d062013-02-08 22:24:37 +0000353 if (Visited.count(*PI)) {
354 // Normal forward edge
355 if (Term->isConditional()) {
356 // Try to treat it like an ELSE block
357 BasicBlock *Other = Term->getSuccessor(!i);
358 if (Visited.count(Other) && !LoopTargets.count(Other) &&
359 !Pred.count(Other) && !Pred.count(*PI)) {
Tom Stellard6b7d99d2012-12-19 22:10:31 +0000360
Tom Stellard27f5d062013-02-08 22:24:37 +0000361 Pred[Other] = BoolFalse;
362 Pred[*PI] = BoolTrue;
363 continue;
364 }
365 }
366
367 } else {
368 // Back edge
369 if (analyzeLoopStart(*PI, BB, buildCondition(Term, i, true)))
370 continue;
371 }
372 Pred[*PI] = buildCondition(Term, i, false);
373 }
374
375 } else {
376
377 // It's an exit from a sub region
378 while(R->getParent() != ParentRegion)
379 R = R->getParent();
380
381 // Edge from inside a subregion to its entry, ignore it
382 if (R == N)
383 continue;
384
385 BasicBlock *Entry = R->getEntry();
386 if (!Visited.count(Entry))
387 if (analyzeLoopStart(Entry, BB, BoolFalse))
388 continue;
389
390 Pred[Entry] = BoolTrue;
391 }
Tom Stellard6b7d99d2012-12-19 22:10:31 +0000392 }
393}
394
Tom Stellard27f5d062013-02-08 22:24:37 +0000395/// \brief Determine the end of the loop
396void AMDGPUStructurizeCFG::analyzeLoopEnd(RegionNode *N) {
Tom Stellard6b7d99d2012-12-19 22:10:31 +0000397
Tom Stellard27f5d062013-02-08 22:24:37 +0000398 if (N->isSubRegion()) {
399 // Test for exit as back edge
400 BasicBlock *Exit = N->getNodeAs<Region>()->getExit();
401 if (Visited.count(Exit))
402 LoopEnd = N->getEntry();
403
404 } else {
405 // Test for sucessors as back edge
406 BasicBlock *BB = N->getNodeAs<BasicBlock>();
407 BranchInst *Term = cast<BranchInst>(BB->getTerminator());
Tom Stellard6b7d99d2012-12-19 22:10:31 +0000408
409 for (unsigned i = 0, e = Term->getNumSuccessors(); i != e; ++i) {
410 BasicBlock *Succ = Term->getSuccessor(i);
Tom Stellard6b7d99d2012-12-19 22:10:31 +0000411
Tom Stellard27f5d062013-02-08 22:24:37 +0000412 if (Visited.count(Succ))
413 LoopEnd = BB;
Tom Stellard6b7d99d2012-12-19 22:10:31 +0000414 }
415 }
416}
417
418/// \brief Collect various loop and predicate infos
419void AMDGPUStructurizeCFG::collectInfos() {
Tom Stellard6b7d99d2012-12-19 22:10:31 +0000420
421 // Reset predicate
422 Predicates.clear();
423
424 // and loop infos
425 LoopStart = LoopEnd = 0;
Tom Stellard27f5d062013-02-08 22:24:37 +0000426 LoopTargets.clear();
Tom Stellard6b7d99d2012-12-19 22:10:31 +0000427 LoopPred.clear();
428
Tom Stellard27f5d062013-02-08 22:24:37 +0000429 // Reset the visited nodes
430 Visited.clear();
431
432 for (RNVector::reverse_iterator OI = Order.rbegin(), OE = Order.rend();
433 OI != OE; ++OI) {
Tom Stellard6b7d99d2012-12-19 22:10:31 +0000434
435 // Analyze all the conditions leading to a node
Tom Stellard27f5d062013-02-08 22:24:37 +0000436 analyzeNode(*OI);
Tom Stellard6b7d99d2012-12-19 22:10:31 +0000437
Tom Stellard27f5d062013-02-08 22:24:37 +0000438 // Remember that we've seen this node
Tom Stellardf4e471a2013-02-08 22:24:38 +0000439 Visited.insert((*OI)->getEntry());
Tom Stellard6b7d99d2012-12-19 22:10:31 +0000440
Tom Stellard27f5d062013-02-08 22:24:37 +0000441 // Find the last back edge
442 analyzeLoopEnd(*OI);
443 }
444
445 // Both or neither must be set
446 assert(!LoopStart == !LoopEnd);
447}
448
449/// \brief Insert the missing branch conditions
450void AMDGPUStructurizeCFG::insertConditions() {
451 SSAUpdater PhiInserter;
452
453 for (BranchVector::iterator I = Conditions.begin(),
454 E = Conditions.end(); I != E; ++I) {
455
456 BranchInst *Term = *I;
457 BasicBlock *Parent = Term->getParent();
458
459 assert(Term->isConditional());
460
461 PhiInserter.Initialize(Boolean, "");
462 if (Parent == LoopEnd) {
463 PhiInserter.AddAvailableValue(LoopStart, BoolTrue);
464 } else {
465 PhiInserter.AddAvailableValue(&Func->getEntryBlock(), BoolFalse);
466 PhiInserter.AddAvailableValue(Parent, BoolFalse);
467 }
468
469 bool ParentHasValue = false;
470 BasicBlock *Succ = Term->getSuccessor(0);
471 BBPredicates &Preds = (Parent == LoopEnd) ? LoopPred : Predicates[Succ];
472 for (BBPredicates::iterator PI = Preds.begin(), PE = Preds.end();
473 PI != PE; ++PI) {
474
475 PhiInserter.AddAvailableValue(PI->first, PI->second);
476 ParentHasValue |= PI->first == Parent;
477 }
478
479 if (ParentHasValue)
480 Term->setCondition(PhiInserter.GetValueAtEndOfBlock(Parent));
481 else
482 Term->setCondition(PhiInserter.GetValueInMiddleOfBlock(Parent));
Tom Stellard6b7d99d2012-12-19 22:10:31 +0000483 }
484}
485
Tom Stellard13cf6cb2013-02-08 22:24:35 +0000486/// \brief Remove all PHI values coming from "From" into "To" and remember
487/// them in DeletedPhis
488void AMDGPUStructurizeCFG::delPhiValues(BasicBlock *From, BasicBlock *To) {
489 PhiMap &Map = DeletedPhis[To];
490 for (BasicBlock::iterator I = To->begin(), E = To->end();
491 I != E && isa<PHINode>(*I);) {
492
493 PHINode &Phi = cast<PHINode>(*I++);
494 while (Phi.getBasicBlockIndex(From) != -1) {
495 Value *Deleted = Phi.removeIncomingValue(From, false);
496 Map[&Phi].push_back(std::make_pair(From, Deleted));
497 }
498 }
499}
500
501/// \brief Add a dummy PHI value as soon as we knew the new predecessor
502void AMDGPUStructurizeCFG::addPhiValues(BasicBlock *From, BasicBlock *To) {
503 for (BasicBlock::iterator I = To->begin(), E = To->end();
504 I != E && isa<PHINode>(*I);) {
505
506 PHINode &Phi = cast<PHINode>(*I++);
507 Value *Undef = UndefValue::get(Phi.getType());
508 Phi.addIncoming(Undef, From);
509 }
510 AddedPhis[To].push_back(From);
511}
512
513/// \brief Add the real PHI value as soon as everything is set up
514void AMDGPUStructurizeCFG::setPhiValues() {
515
516 SSAUpdater Updater;
517 for (BB2BBVecMap::iterator AI = AddedPhis.begin(), AE = AddedPhis.end();
518 AI != AE; ++AI) {
519
520 BasicBlock *To = AI->first;
521 BBVector &From = AI->second;
522
523 if (!DeletedPhis.count(To))
524 continue;
525
526 PhiMap &Map = DeletedPhis[To];
527 for (PhiMap::iterator PI = Map.begin(), PE = Map.end();
528 PI != PE; ++PI) {
529
530 PHINode *Phi = PI->first;
531 Value *Undef = UndefValue::get(Phi->getType());
532 Updater.Initialize(Phi->getType(), "");
533 Updater.AddAvailableValue(&Func->getEntryBlock(), Undef);
534 Updater.AddAvailableValue(To, Undef);
535
Christian Konig4c79c712013-02-16 11:27:35 +0000536 NearestCommonDominator Dominator(DT);
537 Dominator.addBlock(To, false);
Tom Stellard13cf6cb2013-02-08 22:24:35 +0000538 for (BBValueVector::iterator VI = PI->second.begin(),
539 VE = PI->second.end(); VI != VE; ++VI) {
540
541 Updater.AddAvailableValue(VI->first, VI->second);
Christian Konig4c79c712013-02-16 11:27:35 +0000542 Dominator.addBlock(VI->first);
Tom Stellard13cf6cb2013-02-08 22:24:35 +0000543 }
544
Christian Konig4c79c712013-02-16 11:27:35 +0000545 if (!Dominator.wasResultExplicitMentioned())
546 Updater.AddAvailableValue(Dominator.getResult(), Undef);
547
Tom Stellard13cf6cb2013-02-08 22:24:35 +0000548 for (BBVector::iterator FI = From.begin(), FE = From.end();
549 FI != FE; ++FI) {
550
551 int Idx = Phi->getBasicBlockIndex(*FI);
552 assert(Idx != -1);
553 Phi->setIncomingValue(Idx, Updater.GetValueAtEndOfBlock(*FI));
554 }
555 }
556
557 DeletedPhis.erase(To);
558 }
559 assert(DeletedPhis.empty());
560}
561
Tom Stellardf4e471a2013-02-08 22:24:38 +0000562/// \brief Remove phi values from all successors and then remove the terminator.
Tom Stellard6b7d99d2012-12-19 22:10:31 +0000563void AMDGPUStructurizeCFG::killTerminator(BasicBlock *BB) {
Tom Stellard6b7d99d2012-12-19 22:10:31 +0000564 TerminatorInst *Term = BB->getTerminator();
565 if (!Term)
566 return;
567
568 for (succ_iterator SI = succ_begin(BB), SE = succ_end(BB);
569 SI != SE; ++SI) {
570
571 delPhiValues(BB, *SI);
572 }
573
574 Term->eraseFromParent();
575}
576
Tom Stellardf4e471a2013-02-08 22:24:38 +0000577/// \brief Let node exit(s) point to NewExit
578void AMDGPUStructurizeCFG::changeExit(RegionNode *Node, BasicBlock *NewExit,
579 bool IncludeDominator) {
Tom Stellard6b7d99d2012-12-19 22:10:31 +0000580
Tom Stellardf4e471a2013-02-08 22:24:38 +0000581 if (Node->isSubRegion()) {
582 Region *SubRegion = Node->getNodeAs<Region>();
583 BasicBlock *OldExit = SubRegion->getExit();
584 BasicBlock *Dominator = 0;
Tom Stellard6b7d99d2012-12-19 22:10:31 +0000585
Tom Stellardf4e471a2013-02-08 22:24:38 +0000586 // Find all the edges from the sub region to the exit
587 for (pred_iterator I = pred_begin(OldExit), E = pred_end(OldExit);
588 I != E;) {
589
590 BasicBlock *BB = *I++;
591 if (!SubRegion->contains(BB))
592 continue;
593
594 // Modify the edges to point to the new exit
595 delPhiValues(BB, OldExit);
596 BB->getTerminator()->replaceUsesOfWith(OldExit, NewExit);
597 addPhiValues(BB, NewExit);
598
599 // Find the new dominator (if requested)
600 if (IncludeDominator) {
601 if (!Dominator)
602 Dominator = BB;
603 else
604 Dominator = DT->findNearestCommonDominator(Dominator, BB);
605 }
Tom Stellard6b7d99d2012-12-19 22:10:31 +0000606 }
607
Tom Stellardf4e471a2013-02-08 22:24:38 +0000608 // Change the dominator (if requested)
609 if (Dominator)
610 DT->changeImmediateDominator(NewExit, Dominator);
Tom Stellard6b7d99d2012-12-19 22:10:31 +0000611
Tom Stellardf4e471a2013-02-08 22:24:38 +0000612 // Update the region info
613 SubRegion->replaceExit(NewExit);
Tom Stellard6b7d99d2012-12-19 22:10:31 +0000614
Tom Stellard6b7d99d2012-12-19 22:10:31 +0000615 } else {
Tom Stellardf4e471a2013-02-08 22:24:38 +0000616 BasicBlock *BB = Node->getNodeAs<BasicBlock>();
617 killTerminator(BB);
618 BranchInst::Create(NewExit, BB);
619 addPhiValues(BB, NewExit);
620 if (IncludeDominator)
621 DT->changeImmediateDominator(NewExit, BB);
Tom Stellard6b7d99d2012-12-19 22:10:31 +0000622 }
Tom Stellard6b7d99d2012-12-19 22:10:31 +0000623}
624
Tom Stellard6b7d99d2012-12-19 22:10:31 +0000625/// \brief Create a new flow node and update dominator tree and region info
Tom Stellardf4e471a2013-02-08 22:24:38 +0000626BasicBlock *AMDGPUStructurizeCFG::getNextFlow(BasicBlock *Dominator) {
Tom Stellard6b7d99d2012-12-19 22:10:31 +0000627 LLVMContext &Context = Func->getContext();
628 BasicBlock *Insert = Order.empty() ? ParentRegion->getExit() :
629 Order.back()->getEntry();
630 BasicBlock *Flow = BasicBlock::Create(Context, FlowBlockName,
631 Func, Insert);
Tom Stellardf4e471a2013-02-08 22:24:38 +0000632 DT->addNewBlock(Flow, Dominator);
Tom Stellard6b7d99d2012-12-19 22:10:31 +0000633 ParentRegion->getRegionInfo()->setRegionFor(Flow, ParentRegion);
Tom Stellard6b7d99d2012-12-19 22:10:31 +0000634 return Flow;
635}
636
Tom Stellardf4e471a2013-02-08 22:24:38 +0000637/// \brief Create a new or reuse the previous node as flow node
638BasicBlock *AMDGPUStructurizeCFG::needPrefix(RegionNode *&Prev,
639 RegionNode *Node) {
640
641 if (!Prev || Prev->isSubRegion() ||
642 (Node && Node->getEntry() == LoopStart)) {
643
644 // We need to insert a flow node, first figure out the dominator
645 DomTreeNode *Dominator = Prev ? DT->getNode(Prev->getEntry()) : 0;
646 if (!Dominator)
647 Dominator = DT->getNode(Node->getEntry())->getIDom();
648 assert(Dominator && "Illegal loop to function entry");
649
650 // then create the flow node
651 BasicBlock *Flow = getNextFlow(Dominator->getBlock());
652
653 // wire up the new flow
654 if (Prev) {
655 changeExit(Prev, Flow, true);
656 } else {
657 // Parent regions entry needs predicates, create a new region entry
658 BasicBlock *Entry = Node->getEntry();
659 for (pred_iterator I = pred_begin(Entry), E = pred_end(Entry);
660 I != E;) {
661
662 BasicBlock *BB = *(I++);
663 if (ParentRegion->contains(BB))
664 continue;
665
666 // Remove PHY values from outside to our entry node
667 delPhiValues(BB, Entry);
668
669 // Update the branch instructions
670 BB->getTerminator()->replaceUsesOfWith(Entry, Flow);
671 }
672
673 // Populate the region tree with the new entry
674 for (Region *R = ParentRegion; R && R->getEntry() == Entry;
675 R = R->getParent()) {
676 R->replaceEntry(Flow);
677 }
678 }
679 Prev = ParentRegion->getBBNode(Flow);
680
681 } else {
682 killTerminator(Prev->getEntry());
683 }
684
685 return Prev->getEntry();
686}
687
688/// \brief Returns the region exit if possible, otherwise just a new flow node
689BasicBlock *AMDGPUStructurizeCFG::needPostfix(BasicBlock *Flow,
690 bool ExitUseAllowed) {
691
692 if (Order.empty() && ExitUseAllowed) {
693 BasicBlock *Exit = ParentRegion->getExit();
694 DT->changeImmediateDominator(Exit, Flow);
695 addPhiValues(Flow, Exit);
696 return Exit;
697 }
698 return getNextFlow(Flow);
699}
700
701/// \brief Returns the region node for Netx, or null if Next is the exit
702RegionNode *AMDGPUStructurizeCFG::getNextPrev(BasicBlock *Next) {
703 return ParentRegion->contains(Next) ? ParentRegion->getBBNode(Next) : 0;
704}
705
706/// \brief Does BB dominate all the predicates of Node ?
707bool AMDGPUStructurizeCFG::dominatesPredicates(BasicBlock *BB, RegionNode *Node) {
708 BBPredicates &Preds = Predicates[Node->getEntry()];
709 for (BBPredicates::iterator PI = Preds.begin(), PE = Preds.end();
710 PI != PE; ++PI) {
711
712 if (!DT->dominates(BB, PI->first))
713 return false;
714 }
715 return true;
716}
717
Tom Stellard6b7d99d2012-12-19 22:10:31 +0000718/// \brief Can we predict that this node will always be called?
Tom Stellardf4e471a2013-02-08 22:24:38 +0000719bool AMDGPUStructurizeCFG::isPredictableTrue(RegionNode *Who,
720 RegionNode *Where) {
721
722 BBPredicates &Preds = Predicates[Who->getEntry()];
723 bool Dominated = Where == 0;
Tom Stellard6b7d99d2012-12-19 22:10:31 +0000724
725 for (BBPredicates::iterator I = Preds.begin(), E = Preds.end();
726 I != E; ++I) {
727
728 if (I->second != BoolTrue)
729 return false;
730
Tom Stellardf4e471a2013-02-08 22:24:38 +0000731 if (!Dominated && DT->dominates(I->first, Where->getEntry()))
Tom Stellard6b7d99d2012-12-19 22:10:31 +0000732 Dominated = true;
733 }
Tom Stellardf4e471a2013-02-08 22:24:38 +0000734
735 // TODO: The dominator check is too strict
Tom Stellard6b7d99d2012-12-19 22:10:31 +0000736 return Dominated;
737}
738
Tom Stellardf4e471a2013-02-08 22:24:38 +0000739/// Take one node from the order vector and wire it up
740RegionNode *AMDGPUStructurizeCFG::wireFlow(RegionNode *&Prev,
741 bool ExitUseAllowed) {
Tom Stellard6b7d99d2012-12-19 22:10:31 +0000742
Tom Stellardf4e471a2013-02-08 22:24:38 +0000743 RegionNode *Node = Order.pop_back_val();
Tom Stellard6b7d99d2012-12-19 22:10:31 +0000744
Tom Stellardf4e471a2013-02-08 22:24:38 +0000745 if (isPredictableTrue(Node, Prev)) {
746 // Just a linear flow
747 if (Prev) {
748 changeExit(Prev, Node->getEntry(), true);
Tom Stellard6b7d99d2012-12-19 22:10:31 +0000749 }
Tom Stellardf4e471a2013-02-08 22:24:38 +0000750 Prev = Node;
Tom Stellard6b7d99d2012-12-19 22:10:31 +0000751
752 } else {
Tom Stellardf4e471a2013-02-08 22:24:38 +0000753 // Insert extra prefix node (or reuse last one)
754 BasicBlock *Flow = needPrefix(Prev, Node);
755 if (Node->getEntry() == LoopStart)
756 LoopStart = Flow;
Tom Stellard6b7d99d2012-12-19 22:10:31 +0000757
Tom Stellardf4e471a2013-02-08 22:24:38 +0000758 // Insert extra postfix node (or use exit instead)
759 BasicBlock *Entry = Node->getEntry();
760 BasicBlock *Next = needPostfix(Flow, ExitUseAllowed && Entry != LoopEnd);
761
762 // let it point to entry and next block
763 Conditions.push_back(BranchInst::Create(Entry, Next, BoolUndef, Flow));
764 addPhiValues(Flow, Entry);
765 DT->changeImmediateDominator(Entry, Flow);
766
767 Prev = Node;
768 while (!Order.empty() && Node->getEntry() != LoopEnd &&
769 !LoopTargets.count(Order.back()->getEntry()) &&
770 dominatesPredicates(Entry, Order.back())) {
771 Node = wireFlow(Prev, false);
772 }
773
774 changeExit(Prev, Next, false);
775 Prev = getNextPrev(Next);
Tom Stellard6b7d99d2012-12-19 22:10:31 +0000776 }
777
Tom Stellardf4e471a2013-02-08 22:24:38 +0000778 return Node;
Tom Stellard6b7d99d2012-12-19 22:10:31 +0000779}
780
Tom Stellard6b7d99d2012-12-19 22:10:31 +0000781/// After this function control flow looks like it should be, but
Tom Stellardf4e471a2013-02-08 22:24:38 +0000782/// branches and PHI nodes only have undefined conditions.
Tom Stellard6b7d99d2012-12-19 22:10:31 +0000783void AMDGPUStructurizeCFG::createFlow() {
Tom Stellardf4e471a2013-02-08 22:24:38 +0000784
785 BasicBlock *Exit = ParentRegion->getExit();
786 bool EntryDominatesExit = DT->dominates(ParentRegion->getEntry(), Exit);
787
Tom Stellard6b7d99d2012-12-19 22:10:31 +0000788 DeletedPhis.clear();
Tom Stellard13cf6cb2013-02-08 22:24:35 +0000789 AddedPhis.clear();
Tom Stellardf4e471a2013-02-08 22:24:38 +0000790 Conditions.clear();
Tom Stellard6b7d99d2012-12-19 22:10:31 +0000791
Tom Stellardf4e471a2013-02-08 22:24:38 +0000792 RegionNode *Prev = 0;
Tom Stellard6b7d99d2012-12-19 22:10:31 +0000793 while (!Order.empty()) {
Tom Stellardf4e471a2013-02-08 22:24:38 +0000794
795 RegionNode *Node = wireFlow(Prev, EntryDominatesExit);
796
797 // Create an extra loop end node
798 if (Node->getEntry() == LoopEnd) {
799 LoopEnd = needPrefix(Prev, 0);
800 BasicBlock *Next = needPostfix(LoopEnd, EntryDominatesExit);
801
802 Conditions.push_back(BranchInst::Create(Next, LoopStart,
Tom Stellard27f5d062013-02-08 22:24:37 +0000803 BoolUndef, LoopEnd));
Tom Stellard6b7d99d2012-12-19 22:10:31 +0000804 addPhiValues(LoopEnd, LoopStart);
Tom Stellardf4e471a2013-02-08 22:24:38 +0000805 Prev = getNextPrev(Next);
Tom Stellard6b7d99d2012-12-19 22:10:31 +0000806 }
807 }
808
Tom Stellardf4e471a2013-02-08 22:24:38 +0000809 if (Prev)
810 changeExit(Prev, Exit, EntryDominatesExit);
811 else
812 assert(EntryDominatesExit);
Tom Stellard6b7d99d2012-12-19 22:10:31 +0000813}
814
Tom Stellard6b7d99d2012-12-19 22:10:31 +0000815/// Handle a rare case where the disintegrated nodes instructions
816/// no longer dominate all their uses. Not sure if this is really nessasary
817void AMDGPUStructurizeCFG::rebuildSSA() {
Tom Stellard6b7d99d2012-12-19 22:10:31 +0000818 SSAUpdater Updater;
819 for (Region::block_iterator I = ParentRegion->block_begin(),
820 E = ParentRegion->block_end();
821 I != E; ++I) {
822
823 BasicBlock *BB = *I;
824 for (BasicBlock::iterator II = BB->begin(), IE = BB->end();
825 II != IE; ++II) {
826
827 bool Initialized = false;
828 for (Use *I = &II->use_begin().getUse(), *Next; I; I = Next) {
829
830 Next = I->getNext();
831
832 Instruction *User = cast<Instruction>(I->getUser());
833 if (User->getParent() == BB) {
834 continue;
835
836 } else if (PHINode *UserPN = dyn_cast<PHINode>(User)) {
837 if (UserPN->getIncomingBlock(*I) == BB)
838 continue;
839 }
840
841 if (DT->dominates(II, User))
842 continue;
843
844 if (!Initialized) {
845 Value *Undef = UndefValue::get(II->getType());
846 Updater.Initialize(II->getType(), "");
847 Updater.AddAvailableValue(&Func->getEntryBlock(), Undef);
848 Updater.AddAvailableValue(BB, II);
849 Initialized = true;
850 }
851 Updater.RewriteUseAfterInsertions(*I);
852 }
853 }
854 }
855}
856
857/// \brief Run the transformation for each region found
858bool AMDGPUStructurizeCFG::runOnRegion(Region *R, RGPassManager &RGM) {
Tom Stellard6b7d99d2012-12-19 22:10:31 +0000859 if (R->isTopLevelRegion())
860 return false;
861
862 Func = R->getEntry()->getParent();
863 ParentRegion = R;
864
865 DT = &getAnalysis<DominatorTree>();
866
867 orderNodes();
868 collectInfos();
869 createFlow();
870 insertConditions();
Tom Stellard13cf6cb2013-02-08 22:24:35 +0000871 setPhiValues();
Tom Stellard6b7d99d2012-12-19 22:10:31 +0000872 rebuildSSA();
873
Tom Stellard27f5d062013-02-08 22:24:37 +0000874 // Cleanup
Tom Stellard6b7d99d2012-12-19 22:10:31 +0000875 Order.clear();
876 Visited.clear();
877 Predicates.clear();
878 DeletedPhis.clear();
Tom Stellard13cf6cb2013-02-08 22:24:35 +0000879 AddedPhis.clear();
Tom Stellard27f5d062013-02-08 22:24:37 +0000880 Conditions.clear();
881 LoopTargets.clear();
882 LoopPred.clear();
Tom Stellard6b7d99d2012-12-19 22:10:31 +0000883
884 return true;
885}
886
887/// \brief Create the pass
888Pass *llvm::createAMDGPUStructurizeCFGPass() {
889 return new AMDGPUStructurizeCFG();
890}