blob: ab492f40bc2e10f2288efbafe795a23cb2faadf9 [file] [log] [blame]
Evan Chengd38c22b2006-05-11 23:55:42 +00001//===----- ScheduleDAGList.cpp - Reg pressure reduction list scheduler ----===//
2//
3// The LLVM Compiler Infrastructure
4//
Chris Lattnerf3ebc3f2007-12-29 20:36:04 +00005// This file is distributed under the University of Illinois Open Source
6// License. See LICENSE.TXT for details.
Evan Chengd38c22b2006-05-11 23:55:42 +00007//
8//===----------------------------------------------------------------------===//
9//
10// This implements bottom-up and top-down register pressure reduction list
11// schedulers, using standard algorithms. The basic approach uses a priority
12// queue of available nodes to schedule. One at a time, nodes are taken from
13// the priority queue (thus in priority order), checked for legality to
14// schedule, and emitted if legal.
15//
16//===----------------------------------------------------------------------===//
17
Dale Johannesen2182f062007-07-13 17:13:54 +000018#define DEBUG_TYPE "pre-RA-sched"
Evan Chengd38c22b2006-05-11 23:55:42 +000019#include "llvm/CodeGen/ScheduleDAG.h"
Jim Laskey29e635d2006-08-02 12:30:23 +000020#include "llvm/CodeGen/SchedulerRegistry.h"
Dan Gohman3a4be0f2008-02-10 18:45:23 +000021#include "llvm/Target/TargetRegisterInfo.h"
Owen Anderson8c2c1e92006-05-12 06:33:49 +000022#include "llvm/Target/TargetData.h"
Evan Chengd38c22b2006-05-11 23:55:42 +000023#include "llvm/Target/TargetMachine.h"
24#include "llvm/Target/TargetInstrInfo.h"
25#include "llvm/Support/Debug.h"
Chris Lattner3d27be12006-08-27 12:54:02 +000026#include "llvm/Support/Compiler.h"
Evan Chenge6f92252007-09-27 18:46:06 +000027#include "llvm/ADT/SmallPtrSet.h"
Evan Cheng5924bf72007-09-25 01:54:36 +000028#include "llvm/ADT/SmallSet.h"
Evan Chengd38c22b2006-05-11 23:55:42 +000029#include "llvm/ADT/Statistic.h"
30#include <climits>
Evan Chengd38c22b2006-05-11 23:55:42 +000031#include <queue>
32#include "llvm/Support/CommandLine.h"
33using namespace llvm;
34
Dan Gohmanfd227e92008-03-25 17:10:29 +000035STATISTIC(NumBacktracks, "Number of times scheduler backtracked");
Evan Cheng79e97132007-10-05 01:39:18 +000036STATISTIC(NumUnfolds, "Number of nodes unfolded");
Evan Cheng1ec79b42007-09-27 07:09:03 +000037STATISTIC(NumDups, "Number of duplicated nodes");
38STATISTIC(NumCCCopies, "Number of cross class copies");
39
Jim Laskey95eda5b2006-08-01 14:21:23 +000040static RegisterScheduler
41 burrListDAGScheduler("list-burr",
42 " Bottom-up register reduction list scheduling",
43 createBURRListDAGScheduler);
44static RegisterScheduler
45 tdrListrDAGScheduler("list-tdrr",
46 " Top-down register reduction list scheduling",
47 createTDRRListDAGScheduler);
48
Evan Chengd38c22b2006-05-11 23:55:42 +000049namespace {
Evan Chengd38c22b2006-05-11 23:55:42 +000050//===----------------------------------------------------------------------===//
51/// ScheduleDAGRRList - The actual register reduction list scheduler
52/// implementation. This supports both top-down and bottom-up scheduling.
53///
Chris Lattnere097e6f2006-06-28 22:17:39 +000054class VISIBILITY_HIDDEN ScheduleDAGRRList : public ScheduleDAG {
Evan Chengd38c22b2006-05-11 23:55:42 +000055private:
56 /// isBottomUp - This is true if the scheduling problem is bottom-up, false if
57 /// it is top-down.
58 bool isBottomUp;
59
60 /// AvailableQueue - The priority queue to use for the available SUnits.
Evan Chengd38c22b2006-05-11 23:55:42 +000061 SchedulingPriorityQueue *AvailableQueue;
62
Evan Cheng5924bf72007-09-25 01:54:36 +000063 /// LiveRegs / LiveRegDefs - A set of physical registers and their definition
64 /// that are "live". These nodes must be scheduled before any other nodes that
65 /// modifies the registers can be scheduled.
66 SmallSet<unsigned, 4> LiveRegs;
67 std::vector<SUnit*> LiveRegDefs;
68 std::vector<unsigned> LiveRegCycles;
69
Evan Chengd38c22b2006-05-11 23:55:42 +000070public:
71 ScheduleDAGRRList(SelectionDAG &dag, MachineBasicBlock *bb,
72 const TargetMachine &tm, bool isbottomup,
73 SchedulingPriorityQueue *availqueue)
74 : ScheduleDAG(dag, bb, tm), isBottomUp(isbottomup),
75 AvailableQueue(availqueue) {
76 }
77
78 ~ScheduleDAGRRList() {
79 delete AvailableQueue;
80 }
81
82 void Schedule();
83
Roman Levenstein733a4d62008-03-26 11:23:38 +000084 /// IsReachable - Checks if SU is reachable from TargetSU.
Roman Levenstein7e71b4b2008-03-26 09:18:09 +000085 bool IsReachable(SUnit *SU, SUnit *TargetSU);
86
87 /// willCreateCycle - Returns true if adding an edge from SU to TargetSU will
88 /// create a cycle.
89 bool WillCreateCycle(SUnit *SU, SUnit *TargetSU);
90
91 /// AddPred - This adds the specified node X as a predecessor of
92 /// the current node Y if not already.
Roman Levenstein733a4d62008-03-26 11:23:38 +000093 /// This returns true if this is a new predecessor.
94 /// Updates the topological ordering if required.
Roman Levenstein7e71b4b2008-03-26 09:18:09 +000095 bool AddPred(SUnit *Y, SUnit *X, bool isCtrl, bool isSpecial,
Roman Levenstein733a4d62008-03-26 11:23:38 +000096 unsigned PhyReg = 0, int Cost = 1);
Roman Levenstein7e71b4b2008-03-26 09:18:09 +000097
Roman Levenstein733a4d62008-03-26 11:23:38 +000098 /// RemovePred - This removes the specified node N from the predecessors of
99 /// the current node M. Updates the topological ordering if required.
Roman Levenstein7e71b4b2008-03-26 09:18:09 +0000100 bool RemovePred(SUnit *M, SUnit *N, bool isCtrl, bool isSpecial);
101
Evan Chengd38c22b2006-05-11 23:55:42 +0000102private:
Evan Cheng8e136a92007-09-26 21:36:17 +0000103 void ReleasePred(SUnit*, bool, unsigned);
104 void ReleaseSucc(SUnit*, bool isChain, unsigned);
105 void CapturePred(SUnit*, SUnit*, bool);
106 void ScheduleNodeBottomUp(SUnit*, unsigned);
107 void ScheduleNodeTopDown(SUnit*, unsigned);
108 void UnscheduleNodeBottomUp(SUnit*);
109 void BacktrackBottomUp(SUnit*, unsigned, unsigned&);
110 SUnit *CopyAndMoveSuccessors(SUnit*);
Evan Cheng1ec79b42007-09-27 07:09:03 +0000111 void InsertCCCopiesAndMoveSuccs(SUnit*, unsigned,
Evan Cheng8e136a92007-09-26 21:36:17 +0000112 const TargetRegisterClass*,
Evan Cheng1ec79b42007-09-27 07:09:03 +0000113 const TargetRegisterClass*,
114 SmallVector<SUnit*, 2>&);
115 bool DelayForLiveRegsBottomUp(SUnit*, SmallVector<unsigned, 4>&);
Evan Chengd38c22b2006-05-11 23:55:42 +0000116 void ListScheduleTopDown();
117 void ListScheduleBottomUp();
Evan Chengafed73e2006-05-12 01:58:24 +0000118 void CommuteNodesToReducePressure();
Roman Levenstein7e71b4b2008-03-26 09:18:09 +0000119
120
121 /// CreateNewSUnit - Creates a new SUnit and returns a pointer to it.
Roman Levenstein733a4d62008-03-26 11:23:38 +0000122 /// Updates the topological ordering if required.
Roman Levenstein7e71b4b2008-03-26 09:18:09 +0000123 SUnit *CreateNewSUnit(SDNode *N) {
124 SUnit *NewNode = NewSUnit(N);
Roman Levenstein733a4d62008-03-26 11:23:38 +0000125 // Update the topological ordering.
Roman Levenstein7e71b4b2008-03-26 09:18:09 +0000126 if (NewNode->NodeNum >= Node2Index.size())
127 InitDAGTopologicalSorting();
128 return NewNode;
129 }
130
Roman Levenstein733a4d62008-03-26 11:23:38 +0000131 /// CreateClone - Creates a new SUnit from an existing one.
132 /// Updates the topological ordering if required.
Roman Levenstein7e71b4b2008-03-26 09:18:09 +0000133 SUnit *CreateClone(SUnit *N) {
134 SUnit *NewNode = Clone(N);
Roman Levenstein733a4d62008-03-26 11:23:38 +0000135 // Update the topological ordering.
Roman Levenstein7e71b4b2008-03-26 09:18:09 +0000136 if (NewNode->NodeNum >= Node2Index.size())
137 InitDAGTopologicalSorting();
138 return NewNode;
139 }
140
141 /// Functions for preserving the topological ordering
142 /// even after dynamic insertions of new edges.
Roman Levenstein733a4d62008-03-26 11:23:38 +0000143 /// This allows a very fast implementation of IsReachable.
Roman Levenstein7e71b4b2008-03-26 09:18:09 +0000144
145
146 /**
147 The idea of the algorithm is taken from
148 "Online algorithms for managing the topological order of
Roman Levenstein733a4d62008-03-26 11:23:38 +0000149 a directed acyclic graph" by David J. Pearce and Paul H.J. Kelly
150 This is the MNR algorithm, which was first introduced by
151 A. Marchetti-Spaccamela, U. Nanni and H. Rohnert in
Roman Levenstein7e71b4b2008-03-26 09:18:09 +0000152 "Maintaining a topological order under edge insertions".
153
154 Short description of the algorithm:
155
156 Topological ordering, ord, of a DAG maps each node to a topological
Roman Levenstein733a4d62008-03-26 11:23:38 +0000157 index so that for all edges X->Y it is the case that ord(X) < ord(Y).
Roman Levenstein7e71b4b2008-03-26 09:18:09 +0000158
159 This means that if there is a path from the node X to the node Z,
160 then ord(X) < ord(Z).
161
162 This property can be used to check for reachability of nodes:
163 if Z is reachable from X, then an insertion of the edge Z->X would
164 create a cycle.
165
Roman Levenstein733a4d62008-03-26 11:23:38 +0000166 The algorithm first computes a topological ordering for the DAG by initializing
Roman Levenstein7e71b4b2008-03-26 09:18:09 +0000167 the Index2Node and Node2Index arrays and then tries to keep the ordering
168 up-to-date after edge insertions by reordering the DAG.
169
170 On insertion of the edge X->Y, the algorithm first marks by calling DFS the
171 nodes reachable from Y, and then shifts them using Shift to lie immediately
172 after X in Index2Node.
173 */
174
Roman Levenstein733a4d62008-03-26 11:23:38 +0000175 /// InitDAGTopologicalSorting - create the initial topological
176 /// ordering from the DAG to be scheduled.
Roman Levenstein7e71b4b2008-03-26 09:18:09 +0000177 void InitDAGTopologicalSorting();
178
179 /// DFS - make a DFS traversal and mark all nodes affected by the
Roman Levenstein733a4d62008-03-26 11:23:38 +0000180 /// edge insertion. These nodes will later get new topological indexes
181 /// by means of the Shift method.
Roman Levenstein7e71b4b2008-03-26 09:18:09 +0000182 void DFS(SUnit *SU, int UpperBound, bool& HasLoop);
183
184 /// Shift - reassign topological indexes for the nodes in the DAG
Roman Levenstein733a4d62008-03-26 11:23:38 +0000185 /// to preserve the topological ordering.
Roman Levenstein7e71b4b2008-03-26 09:18:09 +0000186 void Shift(BitVector& Visited, int LowerBound, int UpperBound);
187
Roman Levenstein733a4d62008-03-26 11:23:38 +0000188 /// Allocate - assign the topological index to the node n.
Roman Levenstein7e71b4b2008-03-26 09:18:09 +0000189 void Allocate(int n, int index);
190
Roman Levenstein733a4d62008-03-26 11:23:38 +0000191 /// Index2Node - Maps topological index to the node number.
Roman Levenstein7e71b4b2008-03-26 09:18:09 +0000192 std::vector<int> Index2Node;
Roman Levenstein733a4d62008-03-26 11:23:38 +0000193 /// Node2Index - Maps the node number to its topological index.
Roman Levenstein7e71b4b2008-03-26 09:18:09 +0000194 std::vector<int> Node2Index;
Roman Levenstein733a4d62008-03-26 11:23:38 +0000195 /// Visited - a set of nodes visited during a DFS traversal.
Roman Levenstein7e71b4b2008-03-26 09:18:09 +0000196 BitVector Visited;
Evan Chengd38c22b2006-05-11 23:55:42 +0000197};
198} // end anonymous namespace
199
200
201/// Schedule - Schedule the DAG using list scheduling.
202void ScheduleDAGRRList::Schedule() {
Bill Wendling22e978a2006-12-07 20:04:42 +0000203 DOUT << "********** List Scheduling **********\n";
Evan Cheng5924bf72007-09-25 01:54:36 +0000204
Dan Gohman3a4be0f2008-02-10 18:45:23 +0000205 LiveRegDefs.resize(TRI->getNumRegs(), NULL);
206 LiveRegCycles.resize(TRI->getNumRegs(), 0);
Evan Cheng5924bf72007-09-25 01:54:36 +0000207
Evan Chengd38c22b2006-05-11 23:55:42 +0000208 // Build scheduling units.
209 BuildSchedUnits();
210
Evan Chengd38c22b2006-05-11 23:55:42 +0000211 DEBUG(for (unsigned su = 0, e = SUnits.size(); su != e; ++su)
Chris Lattnerd86418a2006-08-17 00:09:56 +0000212 SUnits[su].dumpAll(&DAG));
Evan Cheng47fbeda2006-10-14 08:34:06 +0000213 CalculateDepths();
214 CalculateHeights();
Roman Levenstein7e71b4b2008-03-26 09:18:09 +0000215 InitDAGTopologicalSorting();
Evan Chengd38c22b2006-05-11 23:55:42 +0000216
Evan Chengfd2c5dd2006-11-04 09:44:31 +0000217 AvailableQueue->initNodes(SUnitMap, SUnits);
Dan Gohman54a187e2007-08-20 19:28:38 +0000218
Evan Chengd38c22b2006-05-11 23:55:42 +0000219 // Execute the actual scheduling loop Top-Down or Bottom-Up as appropriate.
220 if (isBottomUp)
221 ListScheduleBottomUp();
222 else
223 ListScheduleTopDown();
224
225 AvailableQueue->releaseState();
Dan Gohman54a187e2007-08-20 19:28:38 +0000226
Evan Cheng009f5f52006-05-25 08:37:31 +0000227 CommuteNodesToReducePressure();
Evan Chengd38c22b2006-05-11 23:55:42 +0000228
Bill Wendling22e978a2006-12-07 20:04:42 +0000229 DOUT << "*** Final schedule ***\n";
Evan Chengd38c22b2006-05-11 23:55:42 +0000230 DEBUG(dumpSchedule());
Bill Wendling22e978a2006-12-07 20:04:42 +0000231 DOUT << "\n";
Evan Chengd38c22b2006-05-11 23:55:42 +0000232
233 // Emit in scheduled order
234 EmitSchedule();
235}
236
Evan Chengfd2c5dd2006-11-04 09:44:31 +0000237/// CommuteNodesToReducePressure - If a node is two-address and commutable, and
Evan Chengafed73e2006-05-12 01:58:24 +0000238/// it is not the last use of its first operand, add it to the CommuteSet if
239/// possible. It will be commuted when it is translated to a MI.
240void ScheduleDAGRRList::CommuteNodesToReducePressure() {
Evan Chenge3c44192007-06-22 01:35:51 +0000241 SmallPtrSet<SUnit*, 4> OperandSeen;
Dan Gohman4370f262008-04-15 01:22:18 +0000242 for (unsigned i = Sequence.size(); i != 0; ) {
243 --i;
Evan Chengafed73e2006-05-12 01:58:24 +0000244 SUnit *SU = Sequence[i];
Evan Cheng8e136a92007-09-26 21:36:17 +0000245 if (!SU || !SU->Node) continue;
Evan Chengfd2c5dd2006-11-04 09:44:31 +0000246 if (SU->isCommutable) {
247 unsigned Opc = SU->Node->getTargetOpcode();
Chris Lattner03ad8852008-01-07 07:27:27 +0000248 const TargetInstrDesc &TID = TII->get(Opc);
Chris Lattnerfd2e3382008-01-07 06:47:00 +0000249 unsigned NumRes = TID.getNumDefs();
Dan Gohman0340d1e2008-02-15 20:50:13 +0000250 unsigned NumOps = TID.getNumOperands() - NumRes;
Evan Chengfd2c5dd2006-11-04 09:44:31 +0000251 for (unsigned j = 0; j != NumOps; ++j) {
Chris Lattnerfd2e3382008-01-07 06:47:00 +0000252 if (TID.getOperandConstraint(j+NumRes, TOI::TIED_TO) == -1)
Evan Chengfd2c5dd2006-11-04 09:44:31 +0000253 continue;
254
255 SDNode *OpN = SU->Node->getOperand(j).Val;
Evan Cheng1bf166312007-11-09 01:27:11 +0000256 SUnit *OpSU = isPassiveNode(OpN) ? NULL : SUnitMap[OpN][SU->InstanceNo];
Evan Chengfd2c5dd2006-11-04 09:44:31 +0000257 if (OpSU && OperandSeen.count(OpSU) == 1) {
258 // Ok, so SU is not the last use of OpSU, but SU is two-address so
259 // it will clobber OpSU. Try to commute SU if no other source operands
260 // are live below.
261 bool DoCommute = true;
262 for (unsigned k = 0; k < NumOps; ++k) {
263 if (k != j) {
264 OpN = SU->Node->getOperand(k).Val;
Evan Cheng1bf166312007-11-09 01:27:11 +0000265 OpSU = isPassiveNode(OpN) ? NULL : SUnitMap[OpN][SU->InstanceNo];
Evan Chengfd2c5dd2006-11-04 09:44:31 +0000266 if (OpSU && OperandSeen.count(OpSU) == 1) {
267 DoCommute = false;
268 break;
269 }
270 }
Evan Chengafed73e2006-05-12 01:58:24 +0000271 }
Evan Chengfd2c5dd2006-11-04 09:44:31 +0000272 if (DoCommute)
273 CommuteSet.insert(SU->Node);
Evan Chengafed73e2006-05-12 01:58:24 +0000274 }
Evan Chengfd2c5dd2006-11-04 09:44:31 +0000275
276 // Only look at the first use&def node for now.
277 break;
Evan Chengafed73e2006-05-12 01:58:24 +0000278 }
279 }
280
Chris Lattnerd86418a2006-08-17 00:09:56 +0000281 for (SUnit::pred_iterator I = SU->Preds.begin(), E = SU->Preds.end();
282 I != E; ++I) {
Evan Cheng0effc3a2007-09-19 01:38:40 +0000283 if (!I->isCtrl)
284 OperandSeen.insert(I->Dep);
Evan Chengafed73e2006-05-12 01:58:24 +0000285 }
286 }
287}
Evan Chengd38c22b2006-05-11 23:55:42 +0000288
289//===----------------------------------------------------------------------===//
290// Bottom-Up Scheduling
291//===----------------------------------------------------------------------===//
292
Evan Chengd38c22b2006-05-11 23:55:42 +0000293/// ReleasePred - Decrement the NumSuccsLeft count of a predecessor. Add it to
Dan Gohman54a187e2007-08-20 19:28:38 +0000294/// the AvailableQueue if the count reaches zero. Also update its cycle bound.
Evan Chengd38c22b2006-05-11 23:55:42 +0000295void ScheduleDAGRRList::ReleasePred(SUnit *PredSU, bool isChain,
296 unsigned CurCycle) {
297 // FIXME: the distance between two nodes is not always == the predecessor's
298 // latency. For example, the reader can very well read the register written
299 // by the predecessor later than the issue cycle. It also depends on the
300 // interrupt model (drain vs. freeze).
301 PredSU->CycleBound = std::max(PredSU->CycleBound, CurCycle + PredSU->Latency);
302
Evan Cheng038dcc52007-09-28 19:24:24 +0000303 --PredSU->NumSuccsLeft;
Evan Chengd38c22b2006-05-11 23:55:42 +0000304
305#ifndef NDEBUG
Evan Cheng038dcc52007-09-28 19:24:24 +0000306 if (PredSU->NumSuccsLeft < 0) {
Bill Wendling22e978a2006-12-07 20:04:42 +0000307 cerr << "*** List scheduling failed! ***\n";
Evan Chengd38c22b2006-05-11 23:55:42 +0000308 PredSU->dump(&DAG);
Bill Wendling22e978a2006-12-07 20:04:42 +0000309 cerr << " has been released too many times!\n";
Evan Chengd38c22b2006-05-11 23:55:42 +0000310 assert(0);
311 }
312#endif
313
Evan Cheng038dcc52007-09-28 19:24:24 +0000314 if (PredSU->NumSuccsLeft == 0) {
Dan Gohman4370f262008-04-15 01:22:18 +0000315 PredSU->isAvailable = true;
316 AvailableQueue->push(PredSU);
Evan Chengd38c22b2006-05-11 23:55:42 +0000317 }
318}
319
320/// ScheduleNodeBottomUp - Add the node to the schedule. Decrement the pending
321/// count of its predecessors. If a predecessor pending count is zero, add it to
322/// the Available queue.
Evan Chengd12c97d2006-05-30 18:05:39 +0000323void ScheduleDAGRRList::ScheduleNodeBottomUp(SUnit *SU, unsigned CurCycle) {
Bill Wendling22e978a2006-12-07 20:04:42 +0000324 DOUT << "*** Scheduling [" << CurCycle << "]: ";
Evan Chengd38c22b2006-05-11 23:55:42 +0000325 DEBUG(SU->dump(&DAG));
326 SU->Cycle = CurCycle;
327
328 AvailableQueue->ScheduledNode(SU);
Evan Chengd38c22b2006-05-11 23:55:42 +0000329
330 // Bottom up: release predecessors
Chris Lattnerd86418a2006-08-17 00:09:56 +0000331 for (SUnit::pred_iterator I = SU->Preds.begin(), E = SU->Preds.end();
Evan Cheng5924bf72007-09-25 01:54:36 +0000332 I != E; ++I) {
Evan Cheng0effc3a2007-09-19 01:38:40 +0000333 ReleasePred(I->Dep, I->isCtrl, CurCycle);
Evan Cheng5924bf72007-09-25 01:54:36 +0000334 if (I->Cost < 0) {
335 // This is a physical register dependency and it's impossible or
336 // expensive to copy the register. Make sure nothing that can
337 // clobber the register is scheduled between the predecessor and
338 // this node.
339 if (LiveRegs.insert(I->Reg)) {
340 LiveRegDefs[I->Reg] = I->Dep;
341 LiveRegCycles[I->Reg] = CurCycle;
342 }
343 }
344 }
345
346 // Release all the implicit physical register defs that are live.
347 for (SUnit::succ_iterator I = SU->Succs.begin(), E = SU->Succs.end();
348 I != E; ++I) {
349 if (I->Cost < 0) {
350 if (LiveRegCycles[I->Reg] == I->Dep->Cycle) {
351 LiveRegs.erase(I->Reg);
352 assert(LiveRegDefs[I->Reg] == SU &&
353 "Physical register dependency violated?");
354 LiveRegDefs[I->Reg] = NULL;
355 LiveRegCycles[I->Reg] = 0;
356 }
357 }
358 }
359
Evan Chengd38c22b2006-05-11 23:55:42 +0000360 SU->isScheduled = true;
Evan Chengd38c22b2006-05-11 23:55:42 +0000361}
362
Evan Cheng5924bf72007-09-25 01:54:36 +0000363/// CapturePred - This does the opposite of ReleasePred. Since SU is being
364/// unscheduled, incrcease the succ left count of its predecessors. Remove
365/// them from AvailableQueue if necessary.
366void ScheduleDAGRRList::CapturePred(SUnit *PredSU, SUnit *SU, bool isChain) {
367 PredSU->CycleBound = 0;
368 for (SUnit::succ_iterator I = PredSU->Succs.begin(), E = PredSU->Succs.end();
369 I != E; ++I) {
370 if (I->Dep == SU)
371 continue;
372 PredSU->CycleBound = std::max(PredSU->CycleBound,
373 I->Dep->Cycle + PredSU->Latency);
374 }
375
376 if (PredSU->isAvailable) {
377 PredSU->isAvailable = false;
378 if (!PredSU->isPending)
379 AvailableQueue->remove(PredSU);
380 }
381
Evan Cheng038dcc52007-09-28 19:24:24 +0000382 ++PredSU->NumSuccsLeft;
Evan Cheng5924bf72007-09-25 01:54:36 +0000383}
384
385/// UnscheduleNodeBottomUp - Remove the node from the schedule, update its and
386/// its predecessor states to reflect the change.
387void ScheduleDAGRRList::UnscheduleNodeBottomUp(SUnit *SU) {
388 DOUT << "*** Unscheduling [" << SU->Cycle << "]: ";
389 DEBUG(SU->dump(&DAG));
390
391 AvailableQueue->UnscheduledNode(SU);
392
393 for (SUnit::pred_iterator I = SU->Preds.begin(), E = SU->Preds.end();
394 I != E; ++I) {
395 CapturePred(I->Dep, SU, I->isCtrl);
396 if (I->Cost < 0 && SU->Cycle == LiveRegCycles[I->Reg]) {
397 LiveRegs.erase(I->Reg);
398 assert(LiveRegDefs[I->Reg] == I->Dep &&
399 "Physical register dependency violated?");
400 LiveRegDefs[I->Reg] = NULL;
401 LiveRegCycles[I->Reg] = 0;
402 }
403 }
404
405 for (SUnit::succ_iterator I = SU->Succs.begin(), E = SU->Succs.end();
406 I != E; ++I) {
407 if (I->Cost < 0) {
408 if (LiveRegs.insert(I->Reg)) {
409 assert(!LiveRegDefs[I->Reg] &&
410 "Physical register dependency violated?");
411 LiveRegDefs[I->Reg] = SU;
412 }
413 if (I->Dep->Cycle < LiveRegCycles[I->Reg])
414 LiveRegCycles[I->Reg] = I->Dep->Cycle;
415 }
416 }
417
418 SU->Cycle = 0;
419 SU->isScheduled = false;
420 SU->isAvailable = true;
421 AvailableQueue->push(SU);
422}
423
Roman Levenstein7e71b4b2008-03-26 09:18:09 +0000424/// IsReachable - Checks if SU is reachable from TargetSU.
425bool ScheduleDAGRRList::IsReachable(SUnit *SU, SUnit *TargetSU) {
Roman Levenstein733a4d62008-03-26 11:23:38 +0000426 // If insertion of the edge SU->TargetSU would create a cycle
427 // then there is a path from TargetSU to SU.
Roman Levenstein7e71b4b2008-03-26 09:18:09 +0000428 int UpperBound, LowerBound;
429 LowerBound = Node2Index[TargetSU->NodeNum];
430 UpperBound = Node2Index[SU->NodeNum];
431 bool HasLoop = false;
432 // Is Ord(TargetSU) < Ord(SU) ?
433 if (LowerBound < UpperBound) {
434 Visited.reset();
435 // There may be a path from TargetSU to SU. Check for it.
436 DFS(TargetSU, UpperBound, HasLoop);
Evan Chengcfd5f822007-09-27 00:25:29 +0000437 }
Roman Levenstein7e71b4b2008-03-26 09:18:09 +0000438 return HasLoop;
Evan Chengcfd5f822007-09-27 00:25:29 +0000439}
440
Roman Levenstein733a4d62008-03-26 11:23:38 +0000441/// Allocate - assign the topological index to the node n.
Roman Levenstein7e71b4b2008-03-26 09:18:09 +0000442inline void ScheduleDAGRRList::Allocate(int n, int index) {
443 Node2Index[n] = index;
444 Index2Node[index] = n;
Evan Chengcfd5f822007-09-27 00:25:29 +0000445}
446
Roman Levenstein733a4d62008-03-26 11:23:38 +0000447/// InitDAGTopologicalSorting - create the initial topological
448/// ordering from the DAG to be scheduled.
Roman Levenstein7e71b4b2008-03-26 09:18:09 +0000449void ScheduleDAGRRList::InitDAGTopologicalSorting() {
450 unsigned DAGSize = SUnits.size();
451 std::vector<unsigned> InDegree(DAGSize);
452 std::vector<SUnit*> WorkList;
453 WorkList.reserve(DAGSize);
454 std::vector<SUnit*> TopOrder;
455 TopOrder.reserve(DAGSize);
456
Roman Levenstein733a4d62008-03-26 11:23:38 +0000457 // Initialize the data structures.
Roman Levenstein7e71b4b2008-03-26 09:18:09 +0000458 for (unsigned i = 0, e = DAGSize; i != e; ++i) {
459 SUnit *SU = &SUnits[i];
460 int NodeNum = SU->NodeNum;
461 unsigned Degree = SU->Succs.size();
462 InDegree[NodeNum] = Degree;
463
464 // Is it a node without dependencies?
465 if (Degree == 0) {
466 assert(SU->Succs.empty() && "SUnit should have no successors");
Roman Levenstein733a4d62008-03-26 11:23:38 +0000467 // Collect leaf nodes.
Roman Levenstein7e71b4b2008-03-26 09:18:09 +0000468 WorkList.push_back(SU);
469 }
470 }
471
472 while (!WorkList.empty()) {
473 SUnit *SU = WorkList.back();
474 WorkList.pop_back();
475 TopOrder.push_back(SU);
476 for (SUnit::const_pred_iterator I = SU->Preds.begin(), E = SU->Preds.end();
477 I != E; ++I) {
478 SUnit *SU = I->Dep;
479 if (!--InDegree[SU->NodeNum])
480 // If all dependencies of the node are processed already,
Roman Levenstein733a4d62008-03-26 11:23:38 +0000481 // then the node can be computed now.
Roman Levenstein7e71b4b2008-03-26 09:18:09 +0000482 WorkList.push_back(SU);
483 }
484 }
485
486 // Second pass, assign the actual topological order as node ids.
487 int Id = 0;
488
489 Index2Node.clear();
490 Node2Index.clear();
491 Index2Node.resize(DAGSize);
492 Node2Index.resize(DAGSize);
493 Visited.resize(DAGSize);
494
495 for (std::vector<SUnit*>::reverse_iterator TI = TopOrder.rbegin(),
496 TE = TopOrder.rend();TI != TE; ++TI) {
497 Allocate((*TI)->NodeNum, Id);
498 Id++;
499 }
500
501#ifndef NDEBUG
502 // Check correctness of the ordering
503 for (unsigned i = 0, e = DAGSize; i != e; ++i) {
504 SUnit *SU = &SUnits[i];
505 for (SUnit::const_pred_iterator I = SU->Preds.begin(), E = SU->Preds.end();
506 I != E; ++I) {
507 assert(Node2Index[SU->NodeNum] > Node2Index[I->Dep->NodeNum] &&
508 "Wrong topological sorting");
509 }
510 }
511#endif
512}
513
Roman Levenstein733a4d62008-03-26 11:23:38 +0000514/// AddPred - adds an edge from SUnit X to SUnit Y.
515/// Updates the topological ordering if required.
Roman Levenstein7e71b4b2008-03-26 09:18:09 +0000516bool ScheduleDAGRRList::AddPred(SUnit *Y, SUnit *X, bool isCtrl, bool isSpecial,
517 unsigned PhyReg, int Cost) {
518 int UpperBound, LowerBound;
519 LowerBound = Node2Index[Y->NodeNum];
520 UpperBound = Node2Index[X->NodeNum];
521 bool HasLoop = false;
522 // Is Ord(X) < Ord(Y) ?
523 if (LowerBound < UpperBound) {
Roman Levenstein733a4d62008-03-26 11:23:38 +0000524 // Update the topological order.
Roman Levenstein7e71b4b2008-03-26 09:18:09 +0000525 Visited.reset();
526 DFS(Y, UpperBound, HasLoop);
527 assert(!HasLoop && "Inserted edge creates a loop!");
Roman Levenstein733a4d62008-03-26 11:23:38 +0000528 // Recompute topological indexes.
Roman Levenstein7e71b4b2008-03-26 09:18:09 +0000529 Shift(Visited, LowerBound, UpperBound);
530 }
Roman Levenstein733a4d62008-03-26 11:23:38 +0000531 // Now really insert the edge.
532 return Y->addPred(X, isCtrl, isSpecial, PhyReg, Cost);
Roman Levenstein7e71b4b2008-03-26 09:18:09 +0000533}
534
Roman Levenstein733a4d62008-03-26 11:23:38 +0000535/// RemovePred - This removes the specified node N from the predecessors of
536/// the current node M. Updates the topological ordering if required.
Roman Levenstein7e71b4b2008-03-26 09:18:09 +0000537bool ScheduleDAGRRList::RemovePred(SUnit *M, SUnit *N,
538 bool isCtrl, bool isSpecial) {
539 // InitDAGTopologicalSorting();
540 return M->removePred(N, isCtrl, isSpecial);
541}
542
Roman Levenstein733a4d62008-03-26 11:23:38 +0000543/// DFS - Make a DFS traversal to mark all nodes reachable from SU and mark
544/// all nodes affected by the edge insertion. These nodes will later get new
545/// topological indexes by means of the Shift method.
Roman Levenstein7e71b4b2008-03-26 09:18:09 +0000546void ScheduleDAGRRList::DFS(SUnit *SU, int UpperBound, bool& HasLoop) {
547 std::vector<SUnit*> WorkList;
548 WorkList.reserve(SUnits.size());
549
550 WorkList.push_back(SU);
551 while (!WorkList.empty()) {
552 SU = WorkList.back();
553 WorkList.pop_back();
554 Visited.set(SU->NodeNum);
555 for (int I = SU->Succs.size()-1; I >= 0; --I) {
556 int s = SU->Succs[I].Dep->NodeNum;
557 if (Node2Index[s] == UpperBound) {
558 HasLoop = true;
559 return;
560 }
Roman Levenstein733a4d62008-03-26 11:23:38 +0000561 // Visit successors if not already and in affected region.
Roman Levenstein7e71b4b2008-03-26 09:18:09 +0000562 if (!Visited.test(s) && Node2Index[s] < UpperBound) {
563 WorkList.push_back(SU->Succs[I].Dep);
564 }
565 }
566 }
567}
568
Roman Levenstein733a4d62008-03-26 11:23:38 +0000569/// Shift - Renumber the nodes so that the topological ordering is
570/// preserved.
Roman Levenstein7e71b4b2008-03-26 09:18:09 +0000571void ScheduleDAGRRList::Shift(BitVector& Visited, int LowerBound,
572 int UpperBound) {
573 std::vector<int> L;
574 int shift = 0;
575 int i;
576
577 for (i = LowerBound; i <= UpperBound; ++i) {
Roman Levenstein733a4d62008-03-26 11:23:38 +0000578 // w is node at topological index i.
Roman Levenstein7e71b4b2008-03-26 09:18:09 +0000579 int w = Index2Node[i];
580 if (Visited.test(w)) {
Roman Levenstein733a4d62008-03-26 11:23:38 +0000581 // Unmark.
Roman Levenstein7e71b4b2008-03-26 09:18:09 +0000582 Visited.reset(w);
583 L.push_back(w);
584 shift = shift + 1;
585 } else {
586 Allocate(w, i - shift);
587 }
588 }
589
590 for (unsigned j = 0; j < L.size(); ++j) {
591 Allocate(L[j], i - shift);
592 i = i + 1;
593 }
594}
595
596
Dan Gohmanfd227e92008-03-25 17:10:29 +0000597/// WillCreateCycle - Returns true if adding an edge from SU to TargetSU will
Evan Chengcfd5f822007-09-27 00:25:29 +0000598/// create a cycle.
Roman Levenstein7e71b4b2008-03-26 09:18:09 +0000599bool ScheduleDAGRRList::WillCreateCycle(SUnit *SU, SUnit *TargetSU) {
600 if (IsReachable(TargetSU, SU))
Evan Chengcfd5f822007-09-27 00:25:29 +0000601 return true;
602 for (SUnit::pred_iterator I = SU->Preds.begin(), E = SU->Preds.end();
603 I != E; ++I)
Roman Levenstein7e71b4b2008-03-26 09:18:09 +0000604 if (I->Cost < 0 && IsReachable(TargetSU, I->Dep))
Evan Chengcfd5f822007-09-27 00:25:29 +0000605 return true;
606 return false;
607}
608
Evan Cheng8e136a92007-09-26 21:36:17 +0000609/// BacktrackBottomUp - Backtrack scheduling to a previous cycle specified in
Evan Cheng5924bf72007-09-25 01:54:36 +0000610/// BTCycle in order to schedule a specific node. Returns the last unscheduled
611/// SUnit. Also returns if a successor is unscheduled in the process.
Evan Cheng8e136a92007-09-26 21:36:17 +0000612void ScheduleDAGRRList::BacktrackBottomUp(SUnit *SU, unsigned BtCycle,
613 unsigned &CurCycle) {
Evan Cheng5924bf72007-09-25 01:54:36 +0000614 SUnit *OldSU = NULL;
Evan Cheng8e136a92007-09-26 21:36:17 +0000615 while (CurCycle > BtCycle) {
Evan Cheng5924bf72007-09-25 01:54:36 +0000616 OldSU = Sequence.back();
617 Sequence.pop_back();
618 if (SU->isSucc(OldSU))
Evan Cheng8e136a92007-09-26 21:36:17 +0000619 // Don't try to remove SU from AvailableQueue.
620 SU->isAvailable = false;
Evan Cheng5924bf72007-09-25 01:54:36 +0000621 UnscheduleNodeBottomUp(OldSU);
622 --CurCycle;
623 }
624
625
626 if (SU->isSucc(OldSU)) {
627 assert(false && "Something is wrong!");
628 abort();
629 }
Evan Cheng1ec79b42007-09-27 07:09:03 +0000630
631 ++NumBacktracks;
Evan Cheng5924bf72007-09-25 01:54:36 +0000632}
633
Evan Cheng5924bf72007-09-25 01:54:36 +0000634/// CopyAndMoveSuccessors - Clone the specified node and move its scheduled
635/// successors to the newly created node.
636SUnit *ScheduleDAGRRList::CopyAndMoveSuccessors(SUnit *SU) {
Evan Cheng79e97132007-10-05 01:39:18 +0000637 if (SU->FlaggedNodes.size())
638 return NULL;
Evan Cheng8e136a92007-09-26 21:36:17 +0000639
Evan Cheng79e97132007-10-05 01:39:18 +0000640 SDNode *N = SU->Node;
641 if (!N)
642 return NULL;
643
644 SUnit *NewSU;
Evan Cheng79e97132007-10-05 01:39:18 +0000645 bool TryUnfold = false;
Evan Cheng84d0ebc2007-10-05 01:42:35 +0000646 for (unsigned i = 0, e = N->getNumValues(); i != e; ++i) {
647 MVT::ValueType VT = N->getValueType(i);
648 if (VT == MVT::Flag)
649 return NULL;
650 else if (VT == MVT::Other)
651 TryUnfold = true;
652 }
Evan Cheng79e97132007-10-05 01:39:18 +0000653 for (unsigned i = 0, e = N->getNumOperands(); i != e; ++i) {
654 const SDOperand &Op = N->getOperand(i);
655 MVT::ValueType VT = Op.Val->getValueType(Op.ResNo);
656 if (VT == MVT::Flag)
657 return NULL;
Evan Cheng79e97132007-10-05 01:39:18 +0000658 }
659
660 if (TryUnfold) {
661 SmallVector<SDNode*, 4> NewNodes;
Owen Anderson0ec92e92008-01-07 01:35:56 +0000662 if (!TII->unfoldMemoryOperand(DAG, N, NewNodes))
Evan Cheng79e97132007-10-05 01:39:18 +0000663 return NULL;
664
665 DOUT << "Unfolding SU # " << SU->NodeNum << "\n";
666 assert(NewNodes.size() == 2 && "Expected a load folding node!");
667
668 N = NewNodes[1];
669 SDNode *LoadNode = NewNodes[0];
Evan Cheng79e97132007-10-05 01:39:18 +0000670 unsigned NumVals = N->getNumValues();
671 unsigned OldNumVals = SU->Node->getNumValues();
672 for (unsigned i = 0; i != NumVals; ++i)
Chris Lattner3cfb56d2007-10-15 06:10:22 +0000673 DAG.ReplaceAllUsesOfValueWith(SDOperand(SU->Node, i), SDOperand(N, i));
Evan Cheng79e97132007-10-05 01:39:18 +0000674 DAG.ReplaceAllUsesOfValueWith(SDOperand(SU->Node, OldNumVals-1),
Chris Lattner3cfb56d2007-10-15 06:10:22 +0000675 SDOperand(LoadNode, 1));
Evan Cheng79e97132007-10-05 01:39:18 +0000676
Roman Levenstein7e71b4b2008-03-26 09:18:09 +0000677 SUnit *NewSU = CreateNewSUnit(N);
Evan Cheng79e97132007-10-05 01:39:18 +0000678 SUnitMap[N].push_back(NewSU);
Chris Lattner03ad8852008-01-07 07:27:27 +0000679 const TargetInstrDesc &TID = TII->get(N->getTargetOpcode());
Dan Gohman856c0122008-02-16 00:25:40 +0000680 for (unsigned i = 0; i != TID.getNumOperands(); ++i) {
Chris Lattnerfd2e3382008-01-07 06:47:00 +0000681 if (TID.getOperandConstraint(i, TOI::TIED_TO) != -1) {
Evan Cheng79e97132007-10-05 01:39:18 +0000682 NewSU->isTwoAddress = true;
683 break;
684 }
685 }
Chris Lattnerfd2e3382008-01-07 06:47:00 +0000686 if (TID.isCommutable())
Evan Cheng79e97132007-10-05 01:39:18 +0000687 NewSU->isCommutable = true;
Evan Cheng79e97132007-10-05 01:39:18 +0000688 // FIXME: Calculate height / depth and propagate the changes?
Evan Cheng91e0fc92007-12-18 08:42:10 +0000689 NewSU->Depth = SU->Depth;
690 NewSU->Height = SU->Height;
Evan Cheng79e97132007-10-05 01:39:18 +0000691 ComputeLatency(NewSU);
692
Evan Cheng91e0fc92007-12-18 08:42:10 +0000693 // LoadNode may already exist. This can happen when there is another
694 // load from the same location and producing the same type of value
695 // but it has different alignment or volatileness.
696 bool isNewLoad = true;
697 SUnit *LoadSU;
698 DenseMap<SDNode*, std::vector<SUnit*> >::iterator SMI =
699 SUnitMap.find(LoadNode);
700 if (SMI != SUnitMap.end()) {
701 LoadSU = SMI->second.front();
702 isNewLoad = false;
703 } else {
Roman Levenstein7e71b4b2008-03-26 09:18:09 +0000704 LoadSU = CreateNewSUnit(LoadNode);
Evan Cheng91e0fc92007-12-18 08:42:10 +0000705 SUnitMap[LoadNode].push_back(LoadSU);
706
707 LoadSU->Depth = SU->Depth;
708 LoadSU->Height = SU->Height;
709 ComputeLatency(LoadSU);
710 }
711
Evan Cheng79e97132007-10-05 01:39:18 +0000712 SUnit *ChainPred = NULL;
713 SmallVector<SDep, 4> ChainSuccs;
714 SmallVector<SDep, 4> LoadPreds;
715 SmallVector<SDep, 4> NodePreds;
716 SmallVector<SDep, 4> NodeSuccs;
717 for (SUnit::pred_iterator I = SU->Preds.begin(), E = SU->Preds.end();
718 I != E; ++I) {
719 if (I->isCtrl)
720 ChainPred = I->Dep;
Evan Cheng567d2e52008-03-04 00:41:45 +0000721 else if (I->Dep->Node && I->Dep->Node->isOperandOf(LoadNode))
Evan Cheng79e97132007-10-05 01:39:18 +0000722 LoadPreds.push_back(SDep(I->Dep, I->Reg, I->Cost, false, false));
723 else
724 NodePreds.push_back(SDep(I->Dep, I->Reg, I->Cost, false, false));
725 }
726 for (SUnit::succ_iterator I = SU->Succs.begin(), E = SU->Succs.end();
727 I != E; ++I) {
728 if (I->isCtrl)
729 ChainSuccs.push_back(SDep(I->Dep, I->Reg, I->Cost,
730 I->isCtrl, I->isSpecial));
731 else
732 NodeSuccs.push_back(SDep(I->Dep, I->Reg, I->Cost,
733 I->isCtrl, I->isSpecial));
734 }
735
Dan Gohman4370f262008-04-15 01:22:18 +0000736 if (ChainPred) {
737 RemovePred(SU, ChainPred, true, false);
738 if (isNewLoad)
739 AddPred(LoadSU, ChainPred, true, false);
Roman Levenstein7e71b4b2008-03-26 09:18:09 +0000740 }
Evan Cheng79e97132007-10-05 01:39:18 +0000741 for (unsigned i = 0, e = LoadPreds.size(); i != e; ++i) {
742 SDep *Pred = &LoadPreds[i];
Roman Levenstein7e71b4b2008-03-26 09:18:09 +0000743 RemovePred(SU, Pred->Dep, Pred->isCtrl, Pred->isSpecial);
744 if (isNewLoad) {
745 AddPred(LoadSU, Pred->Dep, Pred->isCtrl, Pred->isSpecial,
Roman Levenstein733a4d62008-03-26 11:23:38 +0000746 Pred->Reg, Pred->Cost);
Roman Levenstein7e71b4b2008-03-26 09:18:09 +0000747 }
Evan Cheng79e97132007-10-05 01:39:18 +0000748 }
749 for (unsigned i = 0, e = NodePreds.size(); i != e; ++i) {
750 SDep *Pred = &NodePreds[i];
Roman Levenstein7e71b4b2008-03-26 09:18:09 +0000751 RemovePred(SU, Pred->Dep, Pred->isCtrl, Pred->isSpecial);
752 AddPred(NewSU, Pred->Dep, Pred->isCtrl, Pred->isSpecial,
Roman Levenstein733a4d62008-03-26 11:23:38 +0000753 Pred->Reg, Pred->Cost);
Evan Cheng79e97132007-10-05 01:39:18 +0000754 }
755 for (unsigned i = 0, e = NodeSuccs.size(); i != e; ++i) {
756 SDep *Succ = &NodeSuccs[i];
Roman Levenstein7e71b4b2008-03-26 09:18:09 +0000757 RemovePred(Succ->Dep, SU, Succ->isCtrl, Succ->isSpecial);
758 AddPred(Succ->Dep, NewSU, Succ->isCtrl, Succ->isSpecial,
Roman Levenstein733a4d62008-03-26 11:23:38 +0000759 Succ->Reg, Succ->Cost);
Evan Cheng79e97132007-10-05 01:39:18 +0000760 }
761 for (unsigned i = 0, e = ChainSuccs.size(); i != e; ++i) {
762 SDep *Succ = &ChainSuccs[i];
Roman Levenstein7e71b4b2008-03-26 09:18:09 +0000763 RemovePred(Succ->Dep, SU, Succ->isCtrl, Succ->isSpecial);
764 if (isNewLoad) {
765 AddPred(Succ->Dep, LoadSU, Succ->isCtrl, Succ->isSpecial,
Roman Levenstein733a4d62008-03-26 11:23:38 +0000766 Succ->Reg, Succ->Cost);
Roman Levenstein7e71b4b2008-03-26 09:18:09 +0000767 }
Evan Cheng79e97132007-10-05 01:39:18 +0000768 }
Roman Levenstein7e71b4b2008-03-26 09:18:09 +0000769 if (isNewLoad) {
770 AddPred(NewSU, LoadSU, false, false);
771 }
Evan Cheng79e97132007-10-05 01:39:18 +0000772
Evan Cheng91e0fc92007-12-18 08:42:10 +0000773 if (isNewLoad)
774 AvailableQueue->addNode(LoadSU);
Evan Cheng79e97132007-10-05 01:39:18 +0000775 AvailableQueue->addNode(NewSU);
776
777 ++NumUnfolds;
778
779 if (NewSU->NumSuccsLeft == 0) {
780 NewSU->isAvailable = true;
781 return NewSU;
Evan Cheng91e0fc92007-12-18 08:42:10 +0000782 }
783 SU = NewSU;
Evan Cheng79e97132007-10-05 01:39:18 +0000784 }
785
786 DOUT << "Duplicating SU # " << SU->NodeNum << "\n";
Roman Levenstein7e71b4b2008-03-26 09:18:09 +0000787 NewSU = CreateClone(SU);
Evan Cheng5924bf72007-09-25 01:54:36 +0000788
789 // New SUnit has the exact same predecessors.
790 for (SUnit::pred_iterator I = SU->Preds.begin(), E = SU->Preds.end();
791 I != E; ++I)
792 if (!I->isSpecial) {
Roman Levenstein7e71b4b2008-03-26 09:18:09 +0000793 AddPred(NewSU, I->Dep, I->isCtrl, false, I->Reg, I->Cost);
Evan Cheng5924bf72007-09-25 01:54:36 +0000794 NewSU->Depth = std::max(NewSU->Depth, I->Dep->Depth+1);
795 }
796
797 // Only copy scheduled successors. Cut them from old node's successor
798 // list and move them over.
Evan Chengbde499b2007-09-27 07:29:27 +0000799 SmallVector<std::pair<SUnit*, bool>, 4> DelDeps;
Evan Cheng5924bf72007-09-25 01:54:36 +0000800 for (SUnit::succ_iterator I = SU->Succs.begin(), E = SU->Succs.end();
801 I != E; ++I) {
802 if (I->isSpecial)
803 continue;
Evan Cheng5924bf72007-09-25 01:54:36 +0000804 if (I->Dep->isScheduled) {
Evan Chengbde499b2007-09-27 07:29:27 +0000805 NewSU->Height = std::max(NewSU->Height, I->Dep->Height+1);
Roman Levenstein7e71b4b2008-03-26 09:18:09 +0000806 AddPred(I->Dep, NewSU, I->isCtrl, false, I->Reg, I->Cost);
Evan Chengbde499b2007-09-27 07:29:27 +0000807 DelDeps.push_back(std::make_pair(I->Dep, I->isCtrl));
Evan Cheng5924bf72007-09-25 01:54:36 +0000808 }
809 }
810 for (unsigned i = 0, e = DelDeps.size(); i != e; ++i) {
Evan Chengbde499b2007-09-27 07:29:27 +0000811 SUnit *Succ = DelDeps[i].first;
812 bool isCtrl = DelDeps[i].second;
Roman Levenstein7e71b4b2008-03-26 09:18:09 +0000813 RemovePred(Succ, SU, isCtrl, false);
Evan Cheng5924bf72007-09-25 01:54:36 +0000814 }
815
816 AvailableQueue->updateNode(SU);
817 AvailableQueue->addNode(NewSU);
818
Evan Cheng1ec79b42007-09-27 07:09:03 +0000819 ++NumDups;
Evan Cheng5924bf72007-09-25 01:54:36 +0000820 return NewSU;
821}
822
Evan Cheng1ec79b42007-09-27 07:09:03 +0000823/// InsertCCCopiesAndMoveSuccs - Insert expensive cross register class copies
824/// and move all scheduled successors of the given SUnit to the last copy.
825void ScheduleDAGRRList::InsertCCCopiesAndMoveSuccs(SUnit *SU, unsigned Reg,
826 const TargetRegisterClass *DestRC,
827 const TargetRegisterClass *SrcRC,
828 SmallVector<SUnit*, 2> &Copies) {
Roman Levenstein7e71b4b2008-03-26 09:18:09 +0000829 SUnit *CopyFromSU = CreateNewSUnit(NULL);
Evan Cheng8e136a92007-09-26 21:36:17 +0000830 CopyFromSU->CopySrcRC = SrcRC;
831 CopyFromSU->CopyDstRC = DestRC;
832 CopyFromSU->Depth = SU->Depth;
833 CopyFromSU->Height = SU->Height;
834
Roman Levenstein7e71b4b2008-03-26 09:18:09 +0000835 SUnit *CopyToSU = CreateNewSUnit(NULL);
Evan Cheng8e136a92007-09-26 21:36:17 +0000836 CopyToSU->CopySrcRC = DestRC;
837 CopyToSU->CopyDstRC = SrcRC;
838
839 // Only copy scheduled successors. Cut them from old node's successor
840 // list and move them over.
Evan Chengbde499b2007-09-27 07:29:27 +0000841 SmallVector<std::pair<SUnit*, bool>, 4> DelDeps;
Evan Cheng8e136a92007-09-26 21:36:17 +0000842 for (SUnit::succ_iterator I = SU->Succs.begin(), E = SU->Succs.end();
843 I != E; ++I) {
844 if (I->isSpecial)
845 continue;
Evan Cheng8e136a92007-09-26 21:36:17 +0000846 if (I->Dep->isScheduled) {
Evan Chengbde499b2007-09-27 07:29:27 +0000847 CopyToSU->Height = std::max(CopyToSU->Height, I->Dep->Height+1);
Roman Levenstein7e71b4b2008-03-26 09:18:09 +0000848 AddPred(I->Dep, CopyToSU, I->isCtrl, false, I->Reg, I->Cost);
Evan Chengbde499b2007-09-27 07:29:27 +0000849 DelDeps.push_back(std::make_pair(I->Dep, I->isCtrl));
Evan Cheng8e136a92007-09-26 21:36:17 +0000850 }
851 }
852 for (unsigned i = 0, e = DelDeps.size(); i != e; ++i) {
Evan Chengbde499b2007-09-27 07:29:27 +0000853 SUnit *Succ = DelDeps[i].first;
854 bool isCtrl = DelDeps[i].second;
Roman Levenstein7e71b4b2008-03-26 09:18:09 +0000855 RemovePred(Succ, SU, isCtrl, false);
Evan Cheng8e136a92007-09-26 21:36:17 +0000856 }
857
Roman Levenstein7e71b4b2008-03-26 09:18:09 +0000858 AddPred(CopyFromSU, SU, false, false, Reg, -1);
859 AddPred(CopyToSU, CopyFromSU, false, false, Reg, 1);
Evan Cheng8e136a92007-09-26 21:36:17 +0000860
861 AvailableQueue->updateNode(SU);
862 AvailableQueue->addNode(CopyFromSU);
863 AvailableQueue->addNode(CopyToSU);
Evan Cheng1ec79b42007-09-27 07:09:03 +0000864 Copies.push_back(CopyFromSU);
865 Copies.push_back(CopyToSU);
Evan Cheng8e136a92007-09-26 21:36:17 +0000866
Evan Cheng1ec79b42007-09-27 07:09:03 +0000867 ++NumCCCopies;
Evan Cheng8e136a92007-09-26 21:36:17 +0000868}
869
870/// getPhysicalRegisterVT - Returns the ValueType of the physical register
871/// definition of the specified node.
872/// FIXME: Move to SelectionDAG?
873static MVT::ValueType getPhysicalRegisterVT(SDNode *N, unsigned Reg,
874 const TargetInstrInfo *TII) {
Chris Lattner03ad8852008-01-07 07:27:27 +0000875 const TargetInstrDesc &TID = TII->get(N->getTargetOpcode());
Evan Cheng8e136a92007-09-26 21:36:17 +0000876 assert(TID.ImplicitDefs && "Physical reg def must be in implicit def list!");
Chris Lattnerb0d06b42008-01-07 03:13:06 +0000877 unsigned NumRes = TID.getNumDefs();
878 for (const unsigned *ImpDef = TID.getImplicitDefs(); *ImpDef; ++ImpDef) {
Evan Cheng8e136a92007-09-26 21:36:17 +0000879 if (Reg == *ImpDef)
880 break;
881 ++NumRes;
882 }
883 return N->getValueType(NumRes);
884}
885
Evan Cheng5924bf72007-09-25 01:54:36 +0000886/// DelayForLiveRegsBottomUp - Returns true if it is necessary to delay
887/// scheduling of the given node to satisfy live physical register dependencies.
888/// If the specific node is the last one that's available to schedule, do
889/// whatever is necessary (i.e. backtracking or cloning) to make it possible.
Evan Cheng1ec79b42007-09-27 07:09:03 +0000890bool ScheduleDAGRRList::DelayForLiveRegsBottomUp(SUnit *SU,
891 SmallVector<unsigned, 4> &LRegs){
Evan Cheng5924bf72007-09-25 01:54:36 +0000892 if (LiveRegs.empty())
893 return false;
894
Evan Chenge6f92252007-09-27 18:46:06 +0000895 SmallSet<unsigned, 4> RegAdded;
Evan Cheng5924bf72007-09-25 01:54:36 +0000896 // If this node would clobber any "live" register, then it's not ready.
Evan Cheng5924bf72007-09-25 01:54:36 +0000897 for (SUnit::pred_iterator I = SU->Preds.begin(), E = SU->Preds.end();
898 I != E; ++I) {
899 if (I->Cost < 0) {
900 unsigned Reg = I->Reg;
Evan Chenge6f92252007-09-27 18:46:06 +0000901 if (LiveRegs.count(Reg) && LiveRegDefs[Reg] != I->Dep) {
902 if (RegAdded.insert(Reg))
903 LRegs.push_back(Reg);
904 }
Dan Gohman3a4be0f2008-02-10 18:45:23 +0000905 for (const unsigned *Alias = TRI->getAliasSet(Reg);
Evan Cheng5924bf72007-09-25 01:54:36 +0000906 *Alias; ++Alias)
Evan Chenge6f92252007-09-27 18:46:06 +0000907 if (LiveRegs.count(*Alias) && LiveRegDefs[*Alias] != I->Dep) {
908 if (RegAdded.insert(*Alias))
909 LRegs.push_back(*Alias);
910 }
Evan Cheng5924bf72007-09-25 01:54:36 +0000911 }
912 }
913
914 for (unsigned i = 0, e = SU->FlaggedNodes.size()+1; i != e; ++i) {
915 SDNode *Node = (i == 0) ? SU->Node : SU->FlaggedNodes[i-1];
Evan Cheng8e136a92007-09-26 21:36:17 +0000916 if (!Node || !Node->isTargetOpcode())
Evan Cheng5924bf72007-09-25 01:54:36 +0000917 continue;
Chris Lattner03ad8852008-01-07 07:27:27 +0000918 const TargetInstrDesc &TID = TII->get(Node->getTargetOpcode());
Evan Cheng5924bf72007-09-25 01:54:36 +0000919 if (!TID.ImplicitDefs)
920 continue;
921 for (const unsigned *Reg = TID.ImplicitDefs; *Reg; ++Reg) {
Evan Chenge6f92252007-09-27 18:46:06 +0000922 if (LiveRegs.count(*Reg) && LiveRegDefs[*Reg] != SU) {
923 if (RegAdded.insert(*Reg))
924 LRegs.push_back(*Reg);
925 }
Dan Gohman3a4be0f2008-02-10 18:45:23 +0000926 for (const unsigned *Alias = TRI->getAliasSet(*Reg);
Evan Cheng5924bf72007-09-25 01:54:36 +0000927 *Alias; ++Alias)
Evan Chenge6f92252007-09-27 18:46:06 +0000928 if (LiveRegs.count(*Alias) && LiveRegDefs[*Alias] != SU) {
929 if (RegAdded.insert(*Alias))
930 LRegs.push_back(*Alias);
931 }
Evan Cheng5924bf72007-09-25 01:54:36 +0000932 }
933 }
Evan Cheng5924bf72007-09-25 01:54:36 +0000934 return !LRegs.empty();
Evan Chengd38c22b2006-05-11 23:55:42 +0000935}
936
Evan Cheng1ec79b42007-09-27 07:09:03 +0000937
Evan Chengd38c22b2006-05-11 23:55:42 +0000938/// ListScheduleBottomUp - The main loop of list scheduling for bottom-up
939/// schedulers.
940void ScheduleDAGRRList::ListScheduleBottomUp() {
941 unsigned CurCycle = 0;
942 // Add root to Available queue.
Dan Gohman4370f262008-04-15 01:22:18 +0000943 if (!SUnits.empty()) {
944 SUnit *RootSU = SUnitMap[DAG.getRoot().Val].front();
945 assert(RootSU->Succs.empty() && "Graph root shouldn't have successors!");
946 RootSU->isAvailable = true;
947 AvailableQueue->push(RootSU);
948 }
Evan Chengd38c22b2006-05-11 23:55:42 +0000949
950 // While Available queue is not empty, grab the node with the highest
Dan Gohman54a187e2007-08-20 19:28:38 +0000951 // priority. If it is not ready put it back. Schedule the node.
Evan Cheng5924bf72007-09-25 01:54:36 +0000952 SmallVector<SUnit*, 4> NotReady;
Evan Chengd38c22b2006-05-11 23:55:42 +0000953 while (!AvailableQueue->empty()) {
Evan Cheng1ec79b42007-09-27 07:09:03 +0000954 bool Delayed = false;
955 DenseMap<SUnit*, SmallVector<unsigned, 4> > LRegsMap;
Evan Cheng5924bf72007-09-25 01:54:36 +0000956 SUnit *CurSU = AvailableQueue->pop();
957 while (CurSU) {
Evan Cheng1ec79b42007-09-27 07:09:03 +0000958 if (CurSU->CycleBound <= CurCycle) {
959 SmallVector<unsigned, 4> LRegs;
960 if (!DelayForLiveRegsBottomUp(CurSU, LRegs))
Evan Cheng5924bf72007-09-25 01:54:36 +0000961 break;
Evan Cheng1ec79b42007-09-27 07:09:03 +0000962 Delayed = true;
963 LRegsMap.insert(std::make_pair(CurSU, LRegs));
Evan Cheng5924bf72007-09-25 01:54:36 +0000964 }
Evan Cheng1ec79b42007-09-27 07:09:03 +0000965
966 CurSU->isPending = true; // This SU is not in AvailableQueue right now.
967 NotReady.push_back(CurSU);
Evan Cheng5924bf72007-09-25 01:54:36 +0000968 CurSU = AvailableQueue->pop();
Evan Chengd38c22b2006-05-11 23:55:42 +0000969 }
Evan Cheng1ec79b42007-09-27 07:09:03 +0000970
971 // All candidates are delayed due to live physical reg dependencies.
972 // Try backtracking, code duplication, or inserting cross class copies
973 // to resolve it.
974 if (Delayed && !CurSU) {
975 for (unsigned i = 0, e = NotReady.size(); i != e; ++i) {
976 SUnit *TrySU = NotReady[i];
977 SmallVector<unsigned, 4> &LRegs = LRegsMap[TrySU];
978
979 // Try unscheduling up to the point where it's safe to schedule
980 // this node.
981 unsigned LiveCycle = CurCycle;
982 for (unsigned j = 0, ee = LRegs.size(); j != ee; ++j) {
983 unsigned Reg = LRegs[j];
984 unsigned LCycle = LiveRegCycles[Reg];
985 LiveCycle = std::min(LiveCycle, LCycle);
986 }
987 SUnit *OldSU = Sequence[LiveCycle];
988 if (!WillCreateCycle(TrySU, OldSU)) {
989 BacktrackBottomUp(TrySU, LiveCycle, CurCycle);
990 // Force the current node to be scheduled before the node that
991 // requires the physical reg dep.
992 if (OldSU->isAvailable) {
993 OldSU->isAvailable = false;
994 AvailableQueue->remove(OldSU);
995 }
Roman Levenstein7e71b4b2008-03-26 09:18:09 +0000996 AddPred(TrySU, OldSU, true, true);
Evan Cheng1ec79b42007-09-27 07:09:03 +0000997 // If one or more successors has been unscheduled, then the current
998 // node is no longer avaialable. Schedule a successor that's now
999 // available instead.
1000 if (!TrySU->isAvailable)
1001 CurSU = AvailableQueue->pop();
1002 else {
1003 CurSU = TrySU;
1004 TrySU->isPending = false;
1005 NotReady.erase(NotReady.begin()+i);
1006 }
1007 break;
1008 }
1009 }
1010
1011 if (!CurSU) {
Dan Gohmanfd227e92008-03-25 17:10:29 +00001012 // Can't backtrack. Try duplicating the nodes that produces these
Evan Cheng1ec79b42007-09-27 07:09:03 +00001013 // "expensive to copy" values to break the dependency. In case even
1014 // that doesn't work, insert cross class copies.
1015 SUnit *TrySU = NotReady[0];
1016 SmallVector<unsigned, 4> &LRegs = LRegsMap[TrySU];
1017 assert(LRegs.size() == 1 && "Can't handle this yet!");
1018 unsigned Reg = LRegs[0];
1019 SUnit *LRDef = LiveRegDefs[Reg];
Evan Cheng79e97132007-10-05 01:39:18 +00001020 SUnit *NewDef = CopyAndMoveSuccessors(LRDef);
1021 if (!NewDef) {
Evan Cheng1ec79b42007-09-27 07:09:03 +00001022 // Issue expensive cross register class copies.
1023 MVT::ValueType VT = getPhysicalRegisterVT(LRDef->Node, Reg, TII);
1024 const TargetRegisterClass *RC =
Evan Chenge88a6252008-03-11 07:19:34 +00001025 TRI->getPhysicalRegisterRegClass(Reg, VT);
Dan Gohman3a4be0f2008-02-10 18:45:23 +00001026 const TargetRegisterClass *DestRC = TRI->getCrossCopyRegClass(RC);
Evan Cheng1ec79b42007-09-27 07:09:03 +00001027 if (!DestRC) {
1028 assert(false && "Don't know how to copy this physical register!");
1029 abort();
1030 }
1031 SmallVector<SUnit*, 2> Copies;
1032 InsertCCCopiesAndMoveSuccs(LRDef, Reg, DestRC, RC, Copies);
1033 DOUT << "Adding an edge from SU # " << TrySU->NodeNum
1034 << " to SU #" << Copies.front()->NodeNum << "\n";
Roman Levenstein7e71b4b2008-03-26 09:18:09 +00001035 AddPred(TrySU, Copies.front(), true, true);
Evan Cheng1ec79b42007-09-27 07:09:03 +00001036 NewDef = Copies.back();
1037 }
1038
1039 DOUT << "Adding an edge from SU # " << NewDef->NodeNum
1040 << " to SU #" << TrySU->NodeNum << "\n";
1041 LiveRegDefs[Reg] = NewDef;
Roman Levenstein7e71b4b2008-03-26 09:18:09 +00001042 AddPred(NewDef, TrySU, true, true);
Evan Cheng1ec79b42007-09-27 07:09:03 +00001043 TrySU->isAvailable = false;
1044 CurSU = NewDef;
1045 }
1046
1047 if (!CurSU) {
1048 assert(false && "Unable to resolve live physical register dependencies!");
1049 abort();
1050 }
1051 }
1052
Evan Chengd38c22b2006-05-11 23:55:42 +00001053 // Add the nodes that aren't ready back onto the available list.
Evan Cheng5924bf72007-09-25 01:54:36 +00001054 for (unsigned i = 0, e = NotReady.size(); i != e; ++i) {
1055 NotReady[i]->isPending = false;
Evan Cheng1ec79b42007-09-27 07:09:03 +00001056 // May no longer be available due to backtracking.
Evan Cheng5924bf72007-09-25 01:54:36 +00001057 if (NotReady[i]->isAvailable)
1058 AvailableQueue->push(NotReady[i]);
1059 }
Evan Chengd38c22b2006-05-11 23:55:42 +00001060 NotReady.clear();
1061
Evan Cheng5924bf72007-09-25 01:54:36 +00001062 if (!CurSU)
1063 Sequence.push_back(0);
1064 else {
1065 ScheduleNodeBottomUp(CurSU, CurCycle);
1066 Sequence.push_back(CurSU);
1067 }
1068 ++CurCycle;
Evan Chengd38c22b2006-05-11 23:55:42 +00001069 }
1070
Evan Chengd38c22b2006-05-11 23:55:42 +00001071 // Reverse the order if it is bottom up.
1072 std::reverse(Sequence.begin(), Sequence.end());
1073
1074
1075#ifndef NDEBUG
1076 // Verify that all SUnits were scheduled.
1077 bool AnyNotSched = false;
Dan Gohman4370f262008-04-15 01:22:18 +00001078 unsigned DeadNodes = 0;
Evan Chengd38c22b2006-05-11 23:55:42 +00001079 for (unsigned i = 0, e = SUnits.size(); i != e; ++i) {
Dan Gohman4370f262008-04-15 01:22:18 +00001080 if (!SUnits[i].isScheduled) {
1081 if (SUnits[i].NumPreds == 0 && SUnits[i].NumSuccs == 0) {
1082 ++DeadNodes;
1083 continue;
1084 }
Evan Chengd38c22b2006-05-11 23:55:42 +00001085 if (!AnyNotSched)
Bill Wendling22e978a2006-12-07 20:04:42 +00001086 cerr << "*** List scheduling failed! ***\n";
Evan Chengd38c22b2006-05-11 23:55:42 +00001087 SUnits[i].dump(&DAG);
Bill Wendling22e978a2006-12-07 20:04:42 +00001088 cerr << "has not been scheduled!\n";
Evan Chengd38c22b2006-05-11 23:55:42 +00001089 AnyNotSched = true;
1090 }
Dan Gohman4370f262008-04-15 01:22:18 +00001091 if (SUnits[i].NumSuccsLeft != 0) {
1092 if (!AnyNotSched)
1093 cerr << "*** List scheduling failed! ***\n";
1094 SUnits[i].dump(&DAG);
1095 cerr << "has successors left!\n";
1096 AnyNotSched = true;
1097 }
Evan Chengd38c22b2006-05-11 23:55:42 +00001098 }
1099 assert(!AnyNotSched);
Dan Gohman4370f262008-04-15 01:22:18 +00001100 assert(Sequence.size() + DeadNodes == SUnits.size() &&
1101 "The number of nodes scheduled doesn't match the expected number!");
Evan Chengd38c22b2006-05-11 23:55:42 +00001102#endif
1103}
1104
1105//===----------------------------------------------------------------------===//
1106// Top-Down Scheduling
1107//===----------------------------------------------------------------------===//
1108
1109/// ReleaseSucc - Decrement the NumPredsLeft count of a successor. Add it to
Dan Gohman54a187e2007-08-20 19:28:38 +00001110/// the AvailableQueue if the count reaches zero. Also update its cycle bound.
Evan Chengd38c22b2006-05-11 23:55:42 +00001111void ScheduleDAGRRList::ReleaseSucc(SUnit *SuccSU, bool isChain,
1112 unsigned CurCycle) {
1113 // FIXME: the distance between two nodes is not always == the predecessor's
1114 // latency. For example, the reader can very well read the register written
1115 // by the predecessor later than the issue cycle. It also depends on the
1116 // interrupt model (drain vs. freeze).
1117 SuccSU->CycleBound = std::max(SuccSU->CycleBound, CurCycle + SuccSU->Latency);
1118
Evan Cheng038dcc52007-09-28 19:24:24 +00001119 --SuccSU->NumPredsLeft;
Evan Chengd38c22b2006-05-11 23:55:42 +00001120
1121#ifndef NDEBUG
Evan Cheng038dcc52007-09-28 19:24:24 +00001122 if (SuccSU->NumPredsLeft < 0) {
Bill Wendling22e978a2006-12-07 20:04:42 +00001123 cerr << "*** List scheduling failed! ***\n";
Evan Chengd38c22b2006-05-11 23:55:42 +00001124 SuccSU->dump(&DAG);
Bill Wendling22e978a2006-12-07 20:04:42 +00001125 cerr << " has been released too many times!\n";
Evan Chengd38c22b2006-05-11 23:55:42 +00001126 assert(0);
1127 }
1128#endif
1129
Evan Cheng038dcc52007-09-28 19:24:24 +00001130 if (SuccSU->NumPredsLeft == 0) {
Evan Chengd38c22b2006-05-11 23:55:42 +00001131 SuccSU->isAvailable = true;
1132 AvailableQueue->push(SuccSU);
1133 }
1134}
1135
1136
1137/// ScheduleNodeTopDown - Add the node to the schedule. Decrement the pending
1138/// count of its successors. If a successor pending count is zero, add it to
1139/// the Available queue.
Evan Chengd12c97d2006-05-30 18:05:39 +00001140void ScheduleDAGRRList::ScheduleNodeTopDown(SUnit *SU, unsigned CurCycle) {
Bill Wendling22e978a2006-12-07 20:04:42 +00001141 DOUT << "*** Scheduling [" << CurCycle << "]: ";
Evan Chengd38c22b2006-05-11 23:55:42 +00001142 DEBUG(SU->dump(&DAG));
1143 SU->Cycle = CurCycle;
1144
1145 AvailableQueue->ScheduledNode(SU);
Evan Chengd38c22b2006-05-11 23:55:42 +00001146
1147 // Top down: release successors
Chris Lattnerd86418a2006-08-17 00:09:56 +00001148 for (SUnit::succ_iterator I = SU->Succs.begin(), E = SU->Succs.end();
1149 I != E; ++I)
Evan Cheng0effc3a2007-09-19 01:38:40 +00001150 ReleaseSucc(I->Dep, I->isCtrl, CurCycle);
Evan Chengd38c22b2006-05-11 23:55:42 +00001151 SU->isScheduled = true;
Evan Chengd38c22b2006-05-11 23:55:42 +00001152}
1153
Dan Gohman54a187e2007-08-20 19:28:38 +00001154/// ListScheduleTopDown - The main loop of list scheduling for top-down
1155/// schedulers.
Evan Chengd38c22b2006-05-11 23:55:42 +00001156void ScheduleDAGRRList::ListScheduleTopDown() {
1157 unsigned CurCycle = 0;
Evan Chengd38c22b2006-05-11 23:55:42 +00001158
1159 // All leaves to Available queue.
1160 for (unsigned i = 0, e = SUnits.size(); i != e; ++i) {
1161 // It is available if it has no predecessors.
Dan Gohman4370f262008-04-15 01:22:18 +00001162 if (SUnits[i].Preds.empty()) {
Evan Chengd38c22b2006-05-11 23:55:42 +00001163 AvailableQueue->push(&SUnits[i]);
1164 SUnits[i].isAvailable = true;
1165 }
1166 }
1167
Evan Chengd38c22b2006-05-11 23:55:42 +00001168 // While Available queue is not empty, grab the node with the highest
Dan Gohman54a187e2007-08-20 19:28:38 +00001169 // priority. If it is not ready put it back. Schedule the node.
Evan Chengd38c22b2006-05-11 23:55:42 +00001170 std::vector<SUnit*> NotReady;
Evan Chengd38c22b2006-05-11 23:55:42 +00001171 while (!AvailableQueue->empty()) {
Evan Cheng5924bf72007-09-25 01:54:36 +00001172 SUnit *CurSU = AvailableQueue->pop();
1173 while (CurSU && CurSU->CycleBound > CurCycle) {
1174 NotReady.push_back(CurSU);
1175 CurSU = AvailableQueue->pop();
Evan Chengd38c22b2006-05-11 23:55:42 +00001176 }
1177
1178 // Add the nodes that aren't ready back onto the available list.
1179 AvailableQueue->push_all(NotReady);
1180 NotReady.clear();
1181
Evan Cheng5924bf72007-09-25 01:54:36 +00001182 if (!CurSU)
1183 Sequence.push_back(0);
1184 else {
1185 ScheduleNodeTopDown(CurSU, CurCycle);
1186 Sequence.push_back(CurSU);
1187 }
Dan Gohman4370f262008-04-15 01:22:18 +00001188 ++CurCycle;
Evan Chengd38c22b2006-05-11 23:55:42 +00001189 }
1190
1191
1192#ifndef NDEBUG
1193 // Verify that all SUnits were scheduled.
1194 bool AnyNotSched = false;
Dan Gohman4370f262008-04-15 01:22:18 +00001195 unsigned DeadNodes = 0;
Evan Chengd38c22b2006-05-11 23:55:42 +00001196 for (unsigned i = 0, e = SUnits.size(); i != e; ++i) {
1197 if (!SUnits[i].isScheduled) {
Dan Gohman4370f262008-04-15 01:22:18 +00001198 if (SUnits[i].NumPreds == 0 && SUnits[i].NumSuccs == 0) {
1199 ++DeadNodes;
1200 continue;
1201 }
Evan Chengd38c22b2006-05-11 23:55:42 +00001202 if (!AnyNotSched)
Bill Wendling22e978a2006-12-07 20:04:42 +00001203 cerr << "*** List scheduling failed! ***\n";
Evan Chengd38c22b2006-05-11 23:55:42 +00001204 SUnits[i].dump(&DAG);
Bill Wendling22e978a2006-12-07 20:04:42 +00001205 cerr << "has not been scheduled!\n";
Evan Chengd38c22b2006-05-11 23:55:42 +00001206 AnyNotSched = true;
1207 }
Dan Gohman4370f262008-04-15 01:22:18 +00001208 if (SUnits[i].NumPredsLeft != 0) {
1209 if (!AnyNotSched)
1210 cerr << "*** List scheduling failed! ***\n";
1211 SUnits[i].dump(&DAG);
1212 cerr << "has predecessors left!\n";
1213 AnyNotSched = true;
1214 }
Evan Chengd38c22b2006-05-11 23:55:42 +00001215 }
1216 assert(!AnyNotSched);
Dan Gohman4370f262008-04-15 01:22:18 +00001217 assert(Sequence.size() + DeadNodes == SUnits.size() &&
1218 "The number of nodes scheduled doesn't match the expected number!");
Evan Chengd38c22b2006-05-11 23:55:42 +00001219#endif
1220}
1221
1222
1223
1224//===----------------------------------------------------------------------===//
1225// RegReductionPriorityQueue Implementation
1226//===----------------------------------------------------------------------===//
1227//
1228// This is a SchedulingPriorityQueue that schedules using Sethi Ullman numbers
1229// to reduce register pressure.
1230//
1231namespace {
1232 template<class SF>
1233 class RegReductionPriorityQueue;
1234
1235 /// Sorting functions for the Available queue.
1236 struct bu_ls_rr_sort : public std::binary_function<SUnit*, SUnit*, bool> {
1237 RegReductionPriorityQueue<bu_ls_rr_sort> *SPQ;
1238 bu_ls_rr_sort(RegReductionPriorityQueue<bu_ls_rr_sort> *spq) : SPQ(spq) {}
1239 bu_ls_rr_sort(const bu_ls_rr_sort &RHS) : SPQ(RHS.SPQ) {}
1240
1241 bool operator()(const SUnit* left, const SUnit* right) const;
1242 };
1243
1244 struct td_ls_rr_sort : public std::binary_function<SUnit*, SUnit*, bool> {
1245 RegReductionPriorityQueue<td_ls_rr_sort> *SPQ;
1246 td_ls_rr_sort(RegReductionPriorityQueue<td_ls_rr_sort> *spq) : SPQ(spq) {}
1247 td_ls_rr_sort(const td_ls_rr_sort &RHS) : SPQ(RHS.SPQ) {}
1248
1249 bool operator()(const SUnit* left, const SUnit* right) const;
1250 };
1251} // end anonymous namespace
1252
Evan Cheng961bbd32007-01-08 23:50:38 +00001253static inline bool isCopyFromLiveIn(const SUnit *SU) {
1254 SDNode *N = SU->Node;
Evan Cheng8e136a92007-09-26 21:36:17 +00001255 return N && N->getOpcode() == ISD::CopyFromReg &&
Evan Cheng961bbd32007-01-08 23:50:38 +00001256 N->getOperand(N->getNumOperands()-1).getValueType() != MVT::Flag;
1257}
1258
Evan Chengd38c22b2006-05-11 23:55:42 +00001259namespace {
1260 template<class SF>
Chris Lattner996795b2006-06-28 23:17:24 +00001261 class VISIBILITY_HIDDEN RegReductionPriorityQueue
1262 : public SchedulingPriorityQueue {
Evan Chengd38c22b2006-05-11 23:55:42 +00001263 std::priority_queue<SUnit*, std::vector<SUnit*>, SF> Queue;
1264
1265 public:
1266 RegReductionPriorityQueue() :
1267 Queue(SF(this)) {}
1268
Evan Cheng5924bf72007-09-25 01:54:36 +00001269 virtual void initNodes(DenseMap<SDNode*, std::vector<SUnit*> > &sumap,
Evan Chengfd2c5dd2006-11-04 09:44:31 +00001270 std::vector<SUnit> &sunits) {}
Evan Cheng5924bf72007-09-25 01:54:36 +00001271
1272 virtual void addNode(const SUnit *SU) {}
1273
1274 virtual void updateNode(const SUnit *SU) {}
1275
Evan Chengd38c22b2006-05-11 23:55:42 +00001276 virtual void releaseState() {}
1277
Evan Cheng6730f032007-01-08 23:55:53 +00001278 virtual unsigned getNodePriority(const SUnit *SU) const {
Evan Chengd38c22b2006-05-11 23:55:42 +00001279 return 0;
1280 }
1281
Evan Cheng5924bf72007-09-25 01:54:36 +00001282 unsigned size() const { return Queue.size(); }
1283
Evan Chengd38c22b2006-05-11 23:55:42 +00001284 bool empty() const { return Queue.empty(); }
1285
1286 void push(SUnit *U) {
1287 Queue.push(U);
1288 }
1289 void push_all(const std::vector<SUnit *> &Nodes) {
1290 for (unsigned i = 0, e = Nodes.size(); i != e; ++i)
1291 Queue.push(Nodes[i]);
1292 }
1293
1294 SUnit *pop() {
Evan Chengd12c97d2006-05-30 18:05:39 +00001295 if (empty()) return NULL;
Evan Chengd38c22b2006-05-11 23:55:42 +00001296 SUnit *V = Queue.top();
1297 Queue.pop();
1298 return V;
1299 }
Evan Chengfd2c5dd2006-11-04 09:44:31 +00001300
Evan Cheng5924bf72007-09-25 01:54:36 +00001301 /// remove - This is a really inefficient way to remove a node from a
1302 /// priority queue. We should roll our own heap to make this better or
1303 /// something.
1304 void remove(SUnit *SU) {
1305 std::vector<SUnit*> Temp;
1306
1307 assert(!Queue.empty() && "Not in queue!");
1308 while (Queue.top() != SU) {
1309 Temp.push_back(Queue.top());
1310 Queue.pop();
1311 assert(!Queue.empty() && "Not in queue!");
1312 }
1313
1314 // Remove the node from the PQ.
1315 Queue.pop();
1316
1317 // Add all the other nodes back.
1318 for (unsigned i = 0, e = Temp.size(); i != e; ++i)
1319 Queue.push(Temp[i]);
Evan Chengfd2c5dd2006-11-04 09:44:31 +00001320 }
Evan Chengd38c22b2006-05-11 23:55:42 +00001321 };
1322
1323 template<class SF>
Chris Lattner996795b2006-06-28 23:17:24 +00001324 class VISIBILITY_HIDDEN BURegReductionPriorityQueue
1325 : public RegReductionPriorityQueue<SF> {
Evan Cheng5924bf72007-09-25 01:54:36 +00001326 // SUnitMap SDNode to SUnit mapping (n -> n).
1327 DenseMap<SDNode*, std::vector<SUnit*> > *SUnitMap;
Evan Chengfd2c5dd2006-11-04 09:44:31 +00001328
Evan Chengd38c22b2006-05-11 23:55:42 +00001329 // SUnits - The SUnits for the current graph.
1330 const std::vector<SUnit> *SUnits;
1331
1332 // SethiUllmanNumbers - The SethiUllman number for each node.
Evan Cheng961bbd32007-01-08 23:50:38 +00001333 std::vector<unsigned> SethiUllmanNumbers;
Evan Chengd38c22b2006-05-11 23:55:42 +00001334
Evan Chengfd2c5dd2006-11-04 09:44:31 +00001335 const TargetInstrInfo *TII;
Dan Gohman3a4be0f2008-02-10 18:45:23 +00001336 const TargetRegisterInfo *TRI;
Roman Levenstein7e71b4b2008-03-26 09:18:09 +00001337 ScheduleDAGRRList *scheduleDAG;
Evan Chengd38c22b2006-05-11 23:55:42 +00001338 public:
Evan Chengf9891412007-12-20 09:25:31 +00001339 explicit BURegReductionPriorityQueue(const TargetInstrInfo *tii,
Dan Gohman3a4be0f2008-02-10 18:45:23 +00001340 const TargetRegisterInfo *tri)
Roman Levenstein7e71b4b2008-03-26 09:18:09 +00001341 : TII(tii), TRI(tri), scheduleDAG(NULL) {}
Evan Chengd38c22b2006-05-11 23:55:42 +00001342
Evan Cheng5924bf72007-09-25 01:54:36 +00001343 void initNodes(DenseMap<SDNode*, std::vector<SUnit*> > &sumap,
Evan Chengfd2c5dd2006-11-04 09:44:31 +00001344 std::vector<SUnit> &sunits) {
1345 SUnitMap = &sumap;
Evan Chengd38c22b2006-05-11 23:55:42 +00001346 SUnits = &sunits;
1347 // Add pseudo dependency edges for two-address nodes.
Evan Chengafed73e2006-05-12 01:58:24 +00001348 AddPseudoTwoAddrDeps();
Evan Chengd38c22b2006-05-11 23:55:42 +00001349 // Calculate node priorities.
Evan Cheng6730f032007-01-08 23:55:53 +00001350 CalculateSethiUllmanNumbers();
Evan Chengd38c22b2006-05-11 23:55:42 +00001351 }
1352
Evan Cheng5924bf72007-09-25 01:54:36 +00001353 void addNode(const SUnit *SU) {
1354 SethiUllmanNumbers.resize(SUnits->size(), 0);
1355 CalcNodeSethiUllmanNumber(SU);
1356 }
1357
1358 void updateNode(const SUnit *SU) {
1359 SethiUllmanNumbers[SU->NodeNum] = 0;
1360 CalcNodeSethiUllmanNumber(SU);
1361 }
1362
Evan Chengd38c22b2006-05-11 23:55:42 +00001363 void releaseState() {
1364 SUnits = 0;
1365 SethiUllmanNumbers.clear();
1366 }
1367
Evan Cheng6730f032007-01-08 23:55:53 +00001368 unsigned getNodePriority(const SUnit *SU) const {
Evan Cheng961bbd32007-01-08 23:50:38 +00001369 assert(SU->NodeNum < SethiUllmanNumbers.size());
Evan Cheng8e136a92007-09-26 21:36:17 +00001370 unsigned Opc = SU->Node ? SU->Node->getOpcode() : 0;
Evan Cheng961bbd32007-01-08 23:50:38 +00001371 if (Opc == ISD::CopyFromReg && !isCopyFromLiveIn(SU))
1372 // CopyFromReg should be close to its def because it restricts
1373 // allocation choices. But if it is a livein then perhaps we want it
1374 // closer to its uses so it can be coalesced.
1375 return 0xffff;
1376 else if (Opc == ISD::TokenFactor || Opc == ISD::CopyToReg)
1377 // CopyToReg should be close to its uses to facilitate coalescing and
1378 // avoid spilling.
1379 return 0;
Evan Chengaa2d6ef2007-10-12 08:50:34 +00001380 else if (Opc == TargetInstrInfo::EXTRACT_SUBREG ||
1381 Opc == TargetInstrInfo::INSERT_SUBREG)
1382 // EXTRACT_SUBREG / INSERT_SUBREG should be close to its use to
1383 // facilitate coalescing.
1384 return 0;
Evan Cheng961bbd32007-01-08 23:50:38 +00001385 else if (SU->NumSuccs == 0)
1386 // If SU does not have a use, i.e. it doesn't produce a value that would
1387 // be consumed (e.g. store), then it terminates a chain of computation.
1388 // Give it a large SethiUllman number so it will be scheduled right
1389 // before its predecessors that it doesn't lengthen their live ranges.
1390 return 0xffff;
1391 else if (SU->NumPreds == 0)
1392 // If SU does not have a def, schedule it close to its uses because it
1393 // does not lengthen any live ranges.
1394 return 0;
1395 else
1396 return SethiUllmanNumbers[SU->NodeNum];
Evan Chengd38c22b2006-05-11 23:55:42 +00001397 }
1398
Roman Levenstein7e71b4b2008-03-26 09:18:09 +00001399 void setScheduleDAG(ScheduleDAGRRList *scheduleDag) {
1400 scheduleDAG = scheduleDag;
1401 }
1402
Evan Chengd38c22b2006-05-11 23:55:42 +00001403 private:
Evan Cheng73bdf042008-03-01 00:39:47 +00001404 bool canClobber(const SUnit *SU, const SUnit *Op);
Evan Chengd38c22b2006-05-11 23:55:42 +00001405 void AddPseudoTwoAddrDeps();
Evan Cheng6730f032007-01-08 23:55:53 +00001406 void CalculateSethiUllmanNumbers();
1407 unsigned CalcNodeSethiUllmanNumber(const SUnit *SU);
Evan Chengd38c22b2006-05-11 23:55:42 +00001408 };
1409
1410
1411 template<class SF>
Dan Gohman54a187e2007-08-20 19:28:38 +00001412 class VISIBILITY_HIDDEN TDRegReductionPriorityQueue
1413 : public RegReductionPriorityQueue<SF> {
Evan Cheng5924bf72007-09-25 01:54:36 +00001414 // SUnitMap SDNode to SUnit mapping (n -> n).
1415 DenseMap<SDNode*, std::vector<SUnit*> > *SUnitMap;
Evan Chengfd2c5dd2006-11-04 09:44:31 +00001416
Evan Chengd38c22b2006-05-11 23:55:42 +00001417 // SUnits - The SUnits for the current graph.
1418 const std::vector<SUnit> *SUnits;
1419
1420 // SethiUllmanNumbers - The SethiUllman number for each node.
Evan Cheng961bbd32007-01-08 23:50:38 +00001421 std::vector<unsigned> SethiUllmanNumbers;
Evan Chengd38c22b2006-05-11 23:55:42 +00001422
1423 public:
1424 TDRegReductionPriorityQueue() {}
1425
Evan Cheng5924bf72007-09-25 01:54:36 +00001426 void initNodes(DenseMap<SDNode*, std::vector<SUnit*> > &sumap,
Evan Chengfd2c5dd2006-11-04 09:44:31 +00001427 std::vector<SUnit> &sunits) {
1428 SUnitMap = &sumap;
Evan Chengd38c22b2006-05-11 23:55:42 +00001429 SUnits = &sunits;
1430 // Calculate node priorities.
Evan Cheng6730f032007-01-08 23:55:53 +00001431 CalculateSethiUllmanNumbers();
Evan Chengd38c22b2006-05-11 23:55:42 +00001432 }
1433
Evan Cheng5924bf72007-09-25 01:54:36 +00001434 void addNode(const SUnit *SU) {
1435 SethiUllmanNumbers.resize(SUnits->size(), 0);
1436 CalcNodeSethiUllmanNumber(SU);
1437 }
1438
1439 void updateNode(const SUnit *SU) {
1440 SethiUllmanNumbers[SU->NodeNum] = 0;
1441 CalcNodeSethiUllmanNumber(SU);
1442 }
1443
Evan Chengd38c22b2006-05-11 23:55:42 +00001444 void releaseState() {
1445 SUnits = 0;
1446 SethiUllmanNumbers.clear();
1447 }
1448
Evan Cheng6730f032007-01-08 23:55:53 +00001449 unsigned getNodePriority(const SUnit *SU) const {
Evan Cheng961bbd32007-01-08 23:50:38 +00001450 assert(SU->NodeNum < SethiUllmanNumbers.size());
1451 return SethiUllmanNumbers[SU->NodeNum];
Evan Chengd38c22b2006-05-11 23:55:42 +00001452 }
1453
1454 private:
Evan Cheng6730f032007-01-08 23:55:53 +00001455 void CalculateSethiUllmanNumbers();
1456 unsigned CalcNodeSethiUllmanNumber(const SUnit *SU);
Evan Chengd38c22b2006-05-11 23:55:42 +00001457 };
1458}
1459
Evan Chengb9e3db62007-03-14 22:43:40 +00001460/// closestSucc - Returns the scheduled cycle of the successor which is
1461/// closet to the current cycle.
Evan Cheng28748552007-03-13 23:25:11 +00001462static unsigned closestSucc(const SUnit *SU) {
1463 unsigned MaxCycle = 0;
1464 for (SUnit::const_succ_iterator I = SU->Succs.begin(), E = SU->Succs.end();
Evan Chengb9e3db62007-03-14 22:43:40 +00001465 I != E; ++I) {
Evan Cheng0effc3a2007-09-19 01:38:40 +00001466 unsigned Cycle = I->Dep->Cycle;
Evan Chengb9e3db62007-03-14 22:43:40 +00001467 // If there are bunch of CopyToRegs stacked up, they should be considered
1468 // to be at the same position.
Evan Cheng8e136a92007-09-26 21:36:17 +00001469 if (I->Dep->Node && I->Dep->Node->getOpcode() == ISD::CopyToReg)
Evan Cheng0effc3a2007-09-19 01:38:40 +00001470 Cycle = closestSucc(I->Dep)+1;
Evan Chengb9e3db62007-03-14 22:43:40 +00001471 if (Cycle > MaxCycle)
1472 MaxCycle = Cycle;
1473 }
Evan Cheng28748552007-03-13 23:25:11 +00001474 return MaxCycle;
1475}
1476
Evan Cheng61bc51e2007-12-20 02:22:36 +00001477/// calcMaxScratches - Returns an cost estimate of the worse case requirement
1478/// for scratch registers. Live-in operands and live-out results don't count
1479/// since they are "fixed".
1480static unsigned calcMaxScratches(const SUnit *SU) {
1481 unsigned Scratches = 0;
1482 for (SUnit::const_pred_iterator I = SU->Preds.begin(), E = SU->Preds.end();
1483 I != E; ++I) {
1484 if (I->isCtrl) continue; // ignore chain preds
Evan Cheng0e400d42008-01-09 23:01:55 +00001485 if (!I->Dep->Node || I->Dep->Node->getOpcode() != ISD::CopyFromReg)
Evan Cheng61bc51e2007-12-20 02:22:36 +00001486 Scratches++;
1487 }
1488 for (SUnit::const_succ_iterator I = SU->Succs.begin(), E = SU->Succs.end();
1489 I != E; ++I) {
1490 if (I->isCtrl) continue; // ignore chain succs
Evan Cheng0e400d42008-01-09 23:01:55 +00001491 if (!I->Dep->Node || I->Dep->Node->getOpcode() != ISD::CopyToReg)
Evan Cheng61bc51e2007-12-20 02:22:36 +00001492 Scratches += 10;
1493 }
1494 return Scratches;
1495}
1496
Evan Chengd38c22b2006-05-11 23:55:42 +00001497// Bottom up
1498bool bu_ls_rr_sort::operator()(const SUnit *left, const SUnit *right) const {
David Greene4c1e6f32007-06-29 03:42:23 +00001499 // There used to be a special tie breaker here that looked for
David Greene5b6f7552007-06-29 02:48:09 +00001500 // two-address instructions and preferred the instruction with a
1501 // def&use operand. The special case triggered diagnostics when
1502 // _GLIBCXX_DEBUG was enabled because it broke the strict weak
1503 // ordering that priority_queue requires. It didn't help much anyway
1504 // because AddPseudoTwoAddrDeps already covers many of the cases
1505 // where it would have applied. In addition, it's counter-intuitive
1506 // that a tie breaker would be the first thing attempted. There's a
1507 // "real" tie breaker below that is the operation of last resort.
1508 // The fact that the "special tie breaker" would trigger when there
1509 // wasn't otherwise a tie is what broke the strict weak ordering
1510 // constraint.
Evan Cheng99f2f792006-05-13 08:22:24 +00001511
Evan Cheng6730f032007-01-08 23:55:53 +00001512 unsigned LPriority = SPQ->getNodePriority(left);
1513 unsigned RPriority = SPQ->getNodePriority(right);
Evan Cheng73bdf042008-03-01 00:39:47 +00001514 if (LPriority != RPriority)
1515 return LPriority > RPriority;
1516
1517 // Try schedule def + use closer when Sethi-Ullman numbers are the same.
1518 // e.g.
1519 // t1 = op t2, c1
1520 // t3 = op t4, c2
1521 //
1522 // and the following instructions are both ready.
1523 // t2 = op c3
1524 // t4 = op c4
1525 //
1526 // Then schedule t2 = op first.
1527 // i.e.
1528 // t4 = op c4
1529 // t2 = op c3
1530 // t1 = op t2, c1
1531 // t3 = op t4, c2
1532 //
1533 // This creates more short live intervals.
1534 unsigned LDist = closestSucc(left);
1535 unsigned RDist = closestSucc(right);
1536 if (LDist != RDist)
1537 return LDist < RDist;
1538
1539 // Intuitively, it's good to push down instructions whose results are
1540 // liveout so their long live ranges won't conflict with other values
1541 // which are needed inside the BB. Further prioritize liveout instructions
1542 // by the number of operands which are calculated within the BB.
1543 unsigned LScratch = calcMaxScratches(left);
1544 unsigned RScratch = calcMaxScratches(right);
1545 if (LScratch != RScratch)
1546 return LScratch > RScratch;
1547
1548 if (left->Height != right->Height)
1549 return left->Height > right->Height;
1550
1551 if (left->Depth != right->Depth)
1552 return left->Depth < right->Depth;
1553
1554 if (left->CycleBound != right->CycleBound)
1555 return left->CycleBound > right->CycleBound;
1556
1557 // FIXME: No strict ordering.
Evan Chengd38c22b2006-05-11 23:55:42 +00001558 return false;
1559}
1560
Evan Cheng73bdf042008-03-01 00:39:47 +00001561template<class SF> bool
1562BURegReductionPriorityQueue<SF>::canClobber(const SUnit *SU, const SUnit *Op) {
Evan Chengfd2c5dd2006-11-04 09:44:31 +00001563 if (SU->isTwoAddress) {
1564 unsigned Opc = SU->Node->getTargetOpcode();
Chris Lattner03ad8852008-01-07 07:27:27 +00001565 const TargetInstrDesc &TID = TII->get(Opc);
Chris Lattnerfd2e3382008-01-07 06:47:00 +00001566 unsigned NumRes = TID.getNumDefs();
Dan Gohman0340d1e2008-02-15 20:50:13 +00001567 unsigned NumOps = TID.getNumOperands() - NumRes;
Evan Chengfd2c5dd2006-11-04 09:44:31 +00001568 for (unsigned i = 0; i != NumOps; ++i) {
Chris Lattnerfd2e3382008-01-07 06:47:00 +00001569 if (TID.getOperandConstraint(i+NumRes, TOI::TIED_TO) != -1) {
Evan Chengfd2c5dd2006-11-04 09:44:31 +00001570 SDNode *DU = SU->Node->getOperand(i).Val;
Evan Cheng1bf166312007-11-09 01:27:11 +00001571 if ((*SUnitMap).find(DU) != (*SUnitMap).end() &&
1572 Op == (*SUnitMap)[DU][SU->InstanceNo])
Evan Chengfd2c5dd2006-11-04 09:44:31 +00001573 return true;
1574 }
1575 }
Evan Chengd38c22b2006-05-11 23:55:42 +00001576 }
Evan Chengd38c22b2006-05-11 23:55:42 +00001577 return false;
1578}
1579
Evan Chengfd2c5dd2006-11-04 09:44:31 +00001580
Evan Chenga5e595d2007-09-28 22:32:30 +00001581/// hasCopyToRegUse - Return true if SU has a value successor that is a
1582/// CopyToReg node.
1583static bool hasCopyToRegUse(SUnit *SU) {
1584 for (SUnit::const_succ_iterator I = SU->Succs.begin(), E = SU->Succs.end();
1585 I != E; ++I) {
1586 if (I->isCtrl) continue;
1587 SUnit *SuccSU = I->Dep;
1588 if (SuccSU->Node && SuccSU->Node->getOpcode() == ISD::CopyToReg)
1589 return true;
1590 }
1591 return false;
1592}
1593
Evan Chengf9891412007-12-20 09:25:31 +00001594/// canClobberPhysRegDefs - True if SU would clobber one of SuccSU's
1595/// physical register def.
1596static bool canClobberPhysRegDefs(SUnit *SuccSU, SUnit *SU,
1597 const TargetInstrInfo *TII,
Dan Gohman3a4be0f2008-02-10 18:45:23 +00001598 const TargetRegisterInfo *TRI) {
Evan Chengf9891412007-12-20 09:25:31 +00001599 SDNode *N = SuccSU->Node;
Chris Lattnerb0d06b42008-01-07 03:13:06 +00001600 unsigned NumDefs = TII->get(N->getTargetOpcode()).getNumDefs();
1601 const unsigned *ImpDefs = TII->get(N->getTargetOpcode()).getImplicitDefs();
Evan Chengf9891412007-12-20 09:25:31 +00001602 if (!ImpDefs)
1603 return false;
Chris Lattnerb0d06b42008-01-07 03:13:06 +00001604 const unsigned *SUImpDefs =
1605 TII->get(SU->Node->getTargetOpcode()).getImplicitDefs();
Evan Chengf9891412007-12-20 09:25:31 +00001606 if (!SUImpDefs)
1607 return false;
1608 for (unsigned i = NumDefs, e = N->getNumValues(); i != e; ++i) {
1609 MVT::ValueType VT = N->getValueType(i);
1610 if (VT == MVT::Flag || VT == MVT::Other)
1611 continue;
1612 unsigned Reg = ImpDefs[i - NumDefs];
1613 for (;*SUImpDefs; ++SUImpDefs) {
1614 unsigned SUReg = *SUImpDefs;
Dan Gohman3a4be0f2008-02-10 18:45:23 +00001615 if (TRI->regsOverlap(Reg, SUReg))
Evan Chengf9891412007-12-20 09:25:31 +00001616 return true;
1617 }
1618 }
1619 return false;
1620}
1621
Evan Chengd38c22b2006-05-11 23:55:42 +00001622/// AddPseudoTwoAddrDeps - If two nodes share an operand and one of them uses
1623/// it as a def&use operand. Add a pseudo control edge from it to the other
1624/// node (if it won't create a cycle) so the two-address one will be scheduled
Evan Chenga5e595d2007-09-28 22:32:30 +00001625/// first (lower in the schedule). If both nodes are two-address, favor the
1626/// one that has a CopyToReg use (more likely to be a loop induction update).
1627/// If both are two-address, but one is commutable while the other is not
1628/// commutable, favor the one that's not commutable.
Evan Chengd38c22b2006-05-11 23:55:42 +00001629template<class SF>
1630void BURegReductionPriorityQueue<SF>::AddPseudoTwoAddrDeps() {
Evan Chengfd2c5dd2006-11-04 09:44:31 +00001631 for (unsigned i = 0, e = SUnits->size(); i != e; ++i) {
1632 SUnit *SU = (SUnit *)&((*SUnits)[i]);
1633 if (!SU->isTwoAddress)
1634 continue;
1635
1636 SDNode *Node = SU->Node;
Evan Chenga5e595d2007-09-28 22:32:30 +00001637 if (!Node || !Node->isTargetOpcode() || SU->FlaggedNodes.size() > 0)
Evan Chengfd2c5dd2006-11-04 09:44:31 +00001638 continue;
1639
1640 unsigned Opc = Node->getTargetOpcode();
Chris Lattner03ad8852008-01-07 07:27:27 +00001641 const TargetInstrDesc &TID = TII->get(Opc);
Chris Lattnerfd2e3382008-01-07 06:47:00 +00001642 unsigned NumRes = TID.getNumDefs();
Dan Gohman0340d1e2008-02-15 20:50:13 +00001643 unsigned NumOps = TID.getNumOperands() - NumRes;
Evan Chengfd2c5dd2006-11-04 09:44:31 +00001644 for (unsigned j = 0; j != NumOps; ++j) {
Chris Lattnerfd2e3382008-01-07 06:47:00 +00001645 if (TID.getOperandConstraint(j+NumRes, TOI::TIED_TO) != -1) {
Evan Chengfd2c5dd2006-11-04 09:44:31 +00001646 SDNode *DU = SU->Node->getOperand(j).Val;
Evan Cheng1bf166312007-11-09 01:27:11 +00001647 if ((*SUnitMap).find(DU) == (*SUnitMap).end())
1648 continue;
Evan Cheng5924bf72007-09-25 01:54:36 +00001649 SUnit *DUSU = (*SUnitMap)[DU][SU->InstanceNo];
Evan Chengf24d15f2006-11-06 21:33:46 +00001650 if (!DUSU) continue;
Evan Chengfd2c5dd2006-11-04 09:44:31 +00001651 for (SUnit::succ_iterator I = DUSU->Succs.begin(),E = DUSU->Succs.end();
1652 I != E; ++I) {
Evan Cheng0effc3a2007-09-19 01:38:40 +00001653 if (I->isCtrl) continue;
1654 SUnit *SuccSU = I->Dep;
Evan Chengf9891412007-12-20 09:25:31 +00001655 if (SuccSU == SU)
Evan Cheng5924bf72007-09-25 01:54:36 +00001656 continue;
Evan Cheng2dbffa42007-11-06 08:44:59 +00001657 // Be conservative. Ignore if nodes aren't at roughly the same
1658 // depth and height.
1659 if (SuccSU->Height < SU->Height && (SU->Height - SuccSU->Height) > 1)
1660 continue;
Evan Chengaa2d6ef2007-10-12 08:50:34 +00001661 if (!SuccSU->Node || !SuccSU->Node->isTargetOpcode())
1662 continue;
Evan Chengf9891412007-12-20 09:25:31 +00001663 // Don't constrain nodes with physical register defs if the
Dan Gohmancf8827a2008-01-29 12:43:50 +00001664 // predecessor can clobber them.
Evan Chengf9891412007-12-20 09:25:31 +00001665 if (SuccSU->hasPhysRegDefs) {
Dan Gohman3a4be0f2008-02-10 18:45:23 +00001666 if (canClobberPhysRegDefs(SuccSU, SU, TII, TRI))
Evan Chengf9891412007-12-20 09:25:31 +00001667 continue;
1668 }
Evan Chengaa2d6ef2007-10-12 08:50:34 +00001669 // Don't constraint extract_subreg / insert_subreg these may be
1670 // coalesced away. We don't them close to their uses.
1671 unsigned SuccOpc = SuccSU->Node->getTargetOpcode();
1672 if (SuccOpc == TargetInstrInfo::EXTRACT_SUBREG ||
1673 SuccOpc == TargetInstrInfo::INSERT_SUBREG)
1674 continue;
Evan Cheng5924bf72007-09-25 01:54:36 +00001675 if ((!canClobber(SuccSU, DUSU) ||
Evan Chenga5e595d2007-09-28 22:32:30 +00001676 (hasCopyToRegUse(SU) && !hasCopyToRegUse(SuccSU)) ||
Evan Cheng5924bf72007-09-25 01:54:36 +00001677 (!SU->isCommutable && SuccSU->isCommutable)) &&
Roman Levenstein7e71b4b2008-03-26 09:18:09 +00001678 !scheduleDAG->IsReachable(SuccSU, SU)) {
Evan Cheng5924bf72007-09-25 01:54:36 +00001679 DOUT << "Adding an edge from SU # " << SU->NodeNum
1680 << " to SU #" << SuccSU->NodeNum << "\n";
Roman Levenstein7e71b4b2008-03-26 09:18:09 +00001681 scheduleDAG->AddPred(SU, SuccSU, true, true);
Evan Chengfd2c5dd2006-11-04 09:44:31 +00001682 }
1683 }
1684 }
1685 }
1686 }
Evan Chengd38c22b2006-05-11 23:55:42 +00001687}
1688
Evan Cheng6730f032007-01-08 23:55:53 +00001689/// CalcNodeSethiUllmanNumber - Priority is the Sethi Ullman number.
Evan Chengd38c22b2006-05-11 23:55:42 +00001690/// Smaller number is the higher priority.
1691template<class SF>
Chris Lattner296a83c2007-02-01 04:55:59 +00001692unsigned BURegReductionPriorityQueue<SF>::
1693CalcNodeSethiUllmanNumber(const SUnit *SU) {
Evan Cheng961bbd32007-01-08 23:50:38 +00001694 unsigned &SethiUllmanNumber = SethiUllmanNumbers[SU->NodeNum];
Evan Chengd38c22b2006-05-11 23:55:42 +00001695 if (SethiUllmanNumber != 0)
1696 return SethiUllmanNumber;
1697
Evan Cheng961bbd32007-01-08 23:50:38 +00001698 unsigned Extra = 0;
1699 for (SUnit::const_pred_iterator I = SU->Preds.begin(), E = SU->Preds.end();
1700 I != E; ++I) {
Evan Cheng0effc3a2007-09-19 01:38:40 +00001701 if (I->isCtrl) continue; // ignore chain preds
1702 SUnit *PredSU = I->Dep;
Evan Cheng6730f032007-01-08 23:55:53 +00001703 unsigned PredSethiUllman = CalcNodeSethiUllmanNumber(PredSU);
Evan Cheng961bbd32007-01-08 23:50:38 +00001704 if (PredSethiUllman > SethiUllmanNumber) {
1705 SethiUllmanNumber = PredSethiUllman;
1706 Extra = 0;
Evan Cheng0effc3a2007-09-19 01:38:40 +00001707 } else if (PredSethiUllman == SethiUllmanNumber && !I->isCtrl)
Evan Cheng5924bf72007-09-25 01:54:36 +00001708 ++Extra;
Evan Chengd38c22b2006-05-11 23:55:42 +00001709 }
Evan Cheng961bbd32007-01-08 23:50:38 +00001710
1711 SethiUllmanNumber += Extra;
1712
1713 if (SethiUllmanNumber == 0)
1714 SethiUllmanNumber = 1;
Evan Chengd38c22b2006-05-11 23:55:42 +00001715
1716 return SethiUllmanNumber;
1717}
1718
Evan Cheng6730f032007-01-08 23:55:53 +00001719/// CalculateSethiUllmanNumbers - Calculate Sethi-Ullman numbers of all
1720/// scheduling units.
Evan Chengd38c22b2006-05-11 23:55:42 +00001721template<class SF>
Evan Cheng6730f032007-01-08 23:55:53 +00001722void BURegReductionPriorityQueue<SF>::CalculateSethiUllmanNumbers() {
Evan Chengd38c22b2006-05-11 23:55:42 +00001723 SethiUllmanNumbers.assign(SUnits->size(), 0);
1724
1725 for (unsigned i = 0, e = SUnits->size(); i != e; ++i)
Evan Cheng6730f032007-01-08 23:55:53 +00001726 CalcNodeSethiUllmanNumber(&(*SUnits)[i]);
Evan Chengd38c22b2006-05-11 23:55:42 +00001727}
1728
Roman Levenstein30d09512008-03-27 09:44:37 +00001729/// LimitedSumOfUnscheduledPredsOfSuccs - Compute the sum of the unscheduled
Roman Levensteinbc674502008-03-27 09:14:57 +00001730/// predecessors of the successors of the SUnit SU. Stop when the provided
1731/// limit is exceeded.
Roman Levensteinbc674502008-03-27 09:14:57 +00001732static unsigned LimitedSumOfUnscheduledPredsOfSuccs(const SUnit *SU,
1733 unsigned Limit) {
1734 unsigned Sum = 0;
1735 for (SUnit::const_succ_iterator I = SU->Succs.begin(), E = SU->Succs.end();
1736 I != E; ++I) {
1737 SUnit *SuccSU = I->Dep;
1738 for (SUnit::const_pred_iterator II = SuccSU->Preds.begin(),
1739 EE = SuccSU->Preds.end(); II != EE; ++II) {
1740 SUnit *PredSU = II->Dep;
Evan Cheng16d72072008-03-29 18:34:22 +00001741 if (!PredSU->isScheduled)
1742 if (++Sum > Limit)
1743 return Sum;
Roman Levensteinbc674502008-03-27 09:14:57 +00001744 }
1745 }
1746 return Sum;
1747}
1748
Evan Chengd38c22b2006-05-11 23:55:42 +00001749
1750// Top down
1751bool td_ls_rr_sort::operator()(const SUnit *left, const SUnit *right) const {
Evan Cheng6730f032007-01-08 23:55:53 +00001752 unsigned LPriority = SPQ->getNodePriority(left);
1753 unsigned RPriority = SPQ->getNodePriority(right);
Evan Cheng8e136a92007-09-26 21:36:17 +00001754 bool LIsTarget = left->Node && left->Node->isTargetOpcode();
1755 bool RIsTarget = right->Node && right->Node->isTargetOpcode();
Evan Chengd38c22b2006-05-11 23:55:42 +00001756 bool LIsFloater = LIsTarget && left->NumPreds == 0;
1757 bool RIsFloater = RIsTarget && right->NumPreds == 0;
Roman Levensteinbc674502008-03-27 09:14:57 +00001758 unsigned LBonus = (LimitedSumOfUnscheduledPredsOfSuccs(left,1) == 1) ? 2 : 0;
1759 unsigned RBonus = (LimitedSumOfUnscheduledPredsOfSuccs(right,1) == 1) ? 2 : 0;
Evan Chengd38c22b2006-05-11 23:55:42 +00001760
1761 if (left->NumSuccs == 0 && right->NumSuccs != 0)
1762 return false;
1763 else if (left->NumSuccs != 0 && right->NumSuccs == 0)
1764 return true;
1765
Evan Chengd38c22b2006-05-11 23:55:42 +00001766 if (LIsFloater)
1767 LBonus -= 2;
1768 if (RIsFloater)
1769 RBonus -= 2;
1770 if (left->NumSuccs == 1)
1771 LBonus += 2;
1772 if (right->NumSuccs == 1)
1773 RBonus += 2;
1774
Evan Cheng73bdf042008-03-01 00:39:47 +00001775 if (LPriority+LBonus != RPriority+RBonus)
1776 return LPriority+LBonus < RPriority+RBonus;
Anton Korobeynikov035eaac2008-02-20 11:10:28 +00001777
Evan Cheng73bdf042008-03-01 00:39:47 +00001778 if (left->Depth != right->Depth)
1779 return left->Depth < right->Depth;
1780
1781 if (left->NumSuccsLeft != right->NumSuccsLeft)
1782 return left->NumSuccsLeft > right->NumSuccsLeft;
1783
1784 if (left->CycleBound != right->CycleBound)
1785 return left->CycleBound > right->CycleBound;
1786
1787 // FIXME: No strict ordering.
Evan Chengd38c22b2006-05-11 23:55:42 +00001788 return false;
1789}
1790
Evan Cheng6730f032007-01-08 23:55:53 +00001791/// CalcNodeSethiUllmanNumber - Priority is the Sethi Ullman number.
Evan Chengd38c22b2006-05-11 23:55:42 +00001792/// Smaller number is the higher priority.
1793template<class SF>
Chris Lattner296a83c2007-02-01 04:55:59 +00001794unsigned TDRegReductionPriorityQueue<SF>::
1795CalcNodeSethiUllmanNumber(const SUnit *SU) {
Evan Cheng961bbd32007-01-08 23:50:38 +00001796 unsigned &SethiUllmanNumber = SethiUllmanNumbers[SU->NodeNum];
Evan Chengd38c22b2006-05-11 23:55:42 +00001797 if (SethiUllmanNumber != 0)
1798 return SethiUllmanNumber;
1799
Evan Cheng8e136a92007-09-26 21:36:17 +00001800 unsigned Opc = SU->Node ? SU->Node->getOpcode() : 0;
Evan Chengd38c22b2006-05-11 23:55:42 +00001801 if (Opc == ISD::TokenFactor || Opc == ISD::CopyToReg)
Evan Cheng961bbd32007-01-08 23:50:38 +00001802 SethiUllmanNumber = 0xffff;
Evan Chengd38c22b2006-05-11 23:55:42 +00001803 else if (SU->NumSuccsLeft == 0)
1804 // If SU does not have a use, i.e. it doesn't produce a value that would
1805 // be consumed (e.g. store), then it terminates a chain of computation.
Chris Lattner296a83c2007-02-01 04:55:59 +00001806 // Give it a small SethiUllman number so it will be scheduled right before
1807 // its predecessors that it doesn't lengthen their live ranges.
Evan Cheng961bbd32007-01-08 23:50:38 +00001808 SethiUllmanNumber = 0;
Evan Chengd38c22b2006-05-11 23:55:42 +00001809 else if (SU->NumPredsLeft == 0 &&
1810 (Opc != ISD::CopyFromReg || isCopyFromLiveIn(SU)))
Evan Cheng961bbd32007-01-08 23:50:38 +00001811 SethiUllmanNumber = 0xffff;
Evan Chengd38c22b2006-05-11 23:55:42 +00001812 else {
1813 int Extra = 0;
Chris Lattnerd86418a2006-08-17 00:09:56 +00001814 for (SUnit::const_pred_iterator I = SU->Preds.begin(), E = SU->Preds.end();
1815 I != E; ++I) {
Evan Cheng0effc3a2007-09-19 01:38:40 +00001816 if (I->isCtrl) continue; // ignore chain preds
1817 SUnit *PredSU = I->Dep;
Evan Cheng6730f032007-01-08 23:55:53 +00001818 unsigned PredSethiUllman = CalcNodeSethiUllmanNumber(PredSU);
Evan Chengd38c22b2006-05-11 23:55:42 +00001819 if (PredSethiUllman > SethiUllmanNumber) {
1820 SethiUllmanNumber = PredSethiUllman;
1821 Extra = 0;
Evan Cheng0effc3a2007-09-19 01:38:40 +00001822 } else if (PredSethiUllman == SethiUllmanNumber && !I->isCtrl)
Evan Cheng5924bf72007-09-25 01:54:36 +00001823 ++Extra;
Evan Chengd38c22b2006-05-11 23:55:42 +00001824 }
1825
1826 SethiUllmanNumber += Extra;
1827 }
1828
1829 return SethiUllmanNumber;
1830}
1831
Evan Cheng6730f032007-01-08 23:55:53 +00001832/// CalculateSethiUllmanNumbers - Calculate Sethi-Ullman numbers of all
1833/// scheduling units.
Evan Chengd38c22b2006-05-11 23:55:42 +00001834template<class SF>
Evan Cheng6730f032007-01-08 23:55:53 +00001835void TDRegReductionPriorityQueue<SF>::CalculateSethiUllmanNumbers() {
Evan Chengd38c22b2006-05-11 23:55:42 +00001836 SethiUllmanNumbers.assign(SUnits->size(), 0);
1837
1838 for (unsigned i = 0, e = SUnits->size(); i != e; ++i)
Evan Cheng6730f032007-01-08 23:55:53 +00001839 CalcNodeSethiUllmanNumber(&(*SUnits)[i]);
Evan Chengd38c22b2006-05-11 23:55:42 +00001840}
1841
1842//===----------------------------------------------------------------------===//
1843// Public Constructor Functions
1844//===----------------------------------------------------------------------===//
1845
Jim Laskey03593f72006-08-01 18:29:48 +00001846llvm::ScheduleDAG* llvm::createBURRListDAGScheduler(SelectionDAGISel *IS,
1847 SelectionDAG *DAG,
Evan Chengd38c22b2006-05-11 23:55:42 +00001848 MachineBasicBlock *BB) {
Evan Chengfd2c5dd2006-11-04 09:44:31 +00001849 const TargetInstrInfo *TII = DAG->getTarget().getInstrInfo();
Dan Gohman3a4be0f2008-02-10 18:45:23 +00001850 const TargetRegisterInfo *TRI = DAG->getTarget().getRegisterInfo();
Roman Levenstein7e71b4b2008-03-26 09:18:09 +00001851
1852 BURegReductionPriorityQueue<bu_ls_rr_sort> *priorityQueue =
1853 new BURegReductionPriorityQueue<bu_ls_rr_sort>(TII, TRI);
1854
1855 ScheduleDAGRRList * scheduleDAG =
1856 new ScheduleDAGRRList(*DAG, BB, DAG->getTarget(), true, priorityQueue);
1857 priorityQueue->setScheduleDAG(scheduleDAG);
1858 return scheduleDAG;
Evan Chengd38c22b2006-05-11 23:55:42 +00001859}
1860
Jim Laskey03593f72006-08-01 18:29:48 +00001861llvm::ScheduleDAG* llvm::createTDRRListDAGScheduler(SelectionDAGISel *IS,
1862 SelectionDAG *DAG,
Evan Chengd38c22b2006-05-11 23:55:42 +00001863 MachineBasicBlock *BB) {
Jim Laskey95eda5b2006-08-01 14:21:23 +00001864 return new ScheduleDAGRRList(*DAG, BB, DAG->getTarget(), false,
Chris Lattner296a83c2007-02-01 04:55:59 +00001865 new TDRegReductionPriorityQueue<td_ls_rr_sort>());
Evan Chengd38c22b2006-05-11 23:55:42 +00001866}
1867