Dan Gohman | 343f0c0 | 2008-11-19 23:18:57 +0000 | [diff] [blame] | 1 | //===--- ScheduleDAGSDNodes.cpp - Implement the ScheduleDAGSDNodes class --===// |
| 2 | // |
| 3 | // The LLVM Compiler Infrastructure |
| 4 | // |
| 5 | // This file is distributed under the University of Illinois Open Source |
| 6 | // License. See LICENSE.TXT for details. |
| 7 | // |
| 8 | //===----------------------------------------------------------------------===// |
| 9 | // |
| 10 | // This implements the ScheduleDAG class, which is a base class used by |
| 11 | // scheduling implementation classes. |
| 12 | // |
| 13 | //===----------------------------------------------------------------------===// |
| 14 | |
| 15 | #define DEBUG_TYPE "pre-RA-sched" |
Evan Cheng | a8efe28 | 2010-03-14 19:56:39 +0000 | [diff] [blame] | 16 | #include "SDNodeDbgValue.h" |
Dan Gohman | 84fbac5 | 2009-02-06 17:22:58 +0000 | [diff] [blame] | 17 | #include "ScheduleDAGSDNodes.h" |
Dan Gohman | bcea859 | 2009-10-10 01:32:21 +0000 | [diff] [blame] | 18 | #include "InstrEmitter.h" |
Dan Gohman | 343f0c0 | 2008-11-19 23:18:57 +0000 | [diff] [blame] | 19 | #include "llvm/CodeGen/SelectionDAG.h" |
| 20 | #include "llvm/Target/TargetMachine.h" |
| 21 | #include "llvm/Target/TargetInstrInfo.h" |
Evan Cheng | 1cc3984 | 2010-05-20 23:26:43 +0000 | [diff] [blame] | 22 | #include "llvm/Target/TargetLowering.h" |
Dan Gohman | 343f0c0 | 2008-11-19 23:18:57 +0000 | [diff] [blame] | 23 | #include "llvm/Target/TargetRegisterInfo.h" |
David Goodwin | 7104616 | 2009-08-13 16:05:04 +0000 | [diff] [blame] | 24 | #include "llvm/Target/TargetSubtarget.h" |
Evan Cheng | c589e03 | 2010-01-22 03:36:51 +0000 | [diff] [blame] | 25 | #include "llvm/ADT/DenseMap.h" |
| 26 | #include "llvm/ADT/SmallPtrSet.h" |
Evan Cheng | bfcb305 | 2010-03-25 01:38:16 +0000 | [diff] [blame] | 27 | #include "llvm/ADT/SmallSet.h" |
Evan Cheng | c589e03 | 2010-01-22 03:36:51 +0000 | [diff] [blame] | 28 | #include "llvm/ADT/SmallVector.h" |
| 29 | #include "llvm/ADT/Statistic.h" |
Andrew Trick | e0ef509 | 2011-03-05 08:00:22 +0000 | [diff] [blame] | 30 | #include "llvm/Support/CommandLine.h" |
Dan Gohman | 343f0c0 | 2008-11-19 23:18:57 +0000 | [diff] [blame] | 31 | #include "llvm/Support/Debug.h" |
| 32 | #include "llvm/Support/raw_ostream.h" |
| 33 | using namespace llvm; |
| 34 | |
Evan Cheng | c589e03 | 2010-01-22 03:36:51 +0000 | [diff] [blame] | 35 | STATISTIC(LoadsClustered, "Number of loads clustered together"); |
| 36 | |
Andrew Trick | e0ef509 | 2011-03-05 08:00:22 +0000 | [diff] [blame] | 37 | // This allows latency based scheduler to notice high latency instructions |
| 38 | // without a target itinerary. The choise if number here has more to do with |
| 39 | // balancing scheduler heursitics than with the actual machine latency. |
| 40 | static cl::opt<int> HighLatencyCycles( |
| 41 | "sched-high-latency-cycles", cl::Hidden, cl::init(10), |
| 42 | cl::desc("Roughly estimate the number of cycles that 'long latency'" |
| 43 | "instructions take for targets with no itinerary")); |
| 44 | |
Dan Gohman | 79ce276 | 2009-01-15 19:20:50 +0000 | [diff] [blame] | 45 | ScheduleDAGSDNodes::ScheduleDAGSDNodes(MachineFunction &mf) |
Evan Cheng | 3ef1c87 | 2010-09-10 01:29:16 +0000 | [diff] [blame] | 46 | : ScheduleDAG(mf), |
| 47 | InstrItins(mf.getTarget().getInstrItineraryData()) {} |
Dan Gohman | 343f0c0 | 2008-11-19 23:18:57 +0000 | [diff] [blame] | 48 | |
Dan Gohman | 47ac0f0 | 2009-02-11 04:27:20 +0000 | [diff] [blame] | 49 | /// Run - perform scheduling. |
| 50 | /// |
| 51 | void ScheduleDAGSDNodes::Run(SelectionDAG *dag, MachineBasicBlock *bb, |
| 52 | MachineBasicBlock::iterator insertPos) { |
| 53 | DAG = dag; |
| 54 | ScheduleDAG::Run(bb, insertPos); |
| 55 | } |
| 56 | |
Evan Cheng | 1cc3984 | 2010-05-20 23:26:43 +0000 | [diff] [blame] | 57 | /// NewSUnit - Creates a new SUnit and return a ptr to it. |
| 58 | /// |
| 59 | SUnit *ScheduleDAGSDNodes::NewSUnit(SDNode *N) { |
| 60 | #ifndef NDEBUG |
| 61 | const SUnit *Addr = 0; |
| 62 | if (!SUnits.empty()) |
| 63 | Addr = &SUnits[0]; |
| 64 | #endif |
| 65 | SUnits.push_back(SUnit(N, (unsigned)SUnits.size())); |
| 66 | assert((Addr == 0 || Addr == &SUnits[0]) && |
| 67 | "SUnits std::vector reallocated on the fly!"); |
| 68 | SUnits.back().OrigNode = &SUnits.back(); |
| 69 | SUnit *SU = &SUnits.back(); |
| 70 | const TargetLowering &TLI = DAG->getTargetLoweringInfo(); |
Evan Cheng | c120af4 | 2010-08-10 02:39:45 +0000 | [diff] [blame] | 71 | if (!N || |
| 72 | (N->isMachineOpcode() && |
| 73 | N->getMachineOpcode() == TargetOpcode::IMPLICIT_DEF)) |
Evan Cheng | 046fa3f | 2010-05-28 23:26:21 +0000 | [diff] [blame] | 74 | SU->SchedulingPref = Sched::None; |
| 75 | else |
| 76 | SU->SchedulingPref = TLI.getSchedulingPreference(N); |
Evan Cheng | 1cc3984 | 2010-05-20 23:26:43 +0000 | [diff] [blame] | 77 | return SU; |
| 78 | } |
| 79 | |
Dan Gohman | 343f0c0 | 2008-11-19 23:18:57 +0000 | [diff] [blame] | 80 | SUnit *ScheduleDAGSDNodes::Clone(SUnit *Old) { |
| 81 | SUnit *SU = NewSUnit(Old->getNode()); |
| 82 | SU->OrigNode = Old->OrigNode; |
| 83 | SU->Latency = Old->Latency; |
Andrew Trick | 5469976 | 2011-04-07 19:54:57 +0000 | [diff] [blame] | 84 | SU->isVRegCycle = Old->isVRegCycle; |
Evan Cheng | 8239daf | 2010-11-03 00:45:17 +0000 | [diff] [blame] | 85 | SU->isCall = Old->isCall; |
Dan Gohman | 343f0c0 | 2008-11-19 23:18:57 +0000 | [diff] [blame] | 86 | SU->isTwoAddress = Old->isTwoAddress; |
| 87 | SU->isCommutable = Old->isCommutable; |
| 88 | SU->hasPhysRegDefs = Old->hasPhysRegDefs; |
Dan Gohman | 3974667 | 2009-03-23 16:10:52 +0000 | [diff] [blame] | 89 | SU->hasPhysRegClobbers = Old->hasPhysRegClobbers; |
Evan Cheng | 1cc3984 | 2010-05-20 23:26:43 +0000 | [diff] [blame] | 90 | SU->SchedulingPref = Old->SchedulingPref; |
Evan Cheng | e57187c | 2009-01-16 20:57:18 +0000 | [diff] [blame] | 91 | Old->isCloned = true; |
Dan Gohman | 343f0c0 | 2008-11-19 23:18:57 +0000 | [diff] [blame] | 92 | return SU; |
| 93 | } |
| 94 | |
| 95 | /// CheckForPhysRegDependency - Check if the dependency between def and use of |
| 96 | /// a specified operand is a physical register dependency. If so, returns the |
Evan Cheng | c29a56d | 2009-01-12 03:19:55 +0000 | [diff] [blame] | 97 | /// register and the cost of copying the register. |
Dan Gohman | 343f0c0 | 2008-11-19 23:18:57 +0000 | [diff] [blame] | 98 | static void CheckForPhysRegDependency(SDNode *Def, SDNode *User, unsigned Op, |
Andrew Trick | cd5af07 | 2011-02-03 23:00:17 +0000 | [diff] [blame] | 99 | const TargetRegisterInfo *TRI, |
Dan Gohman | 343f0c0 | 2008-11-19 23:18:57 +0000 | [diff] [blame] | 100 | const TargetInstrInfo *TII, |
Evan Cheng | c29a56d | 2009-01-12 03:19:55 +0000 | [diff] [blame] | 101 | unsigned &PhysReg, int &Cost) { |
Dan Gohman | 343f0c0 | 2008-11-19 23:18:57 +0000 | [diff] [blame] | 102 | if (Op != 2 || User->getOpcode() != ISD::CopyToReg) |
| 103 | return; |
| 104 | |
| 105 | unsigned Reg = cast<RegisterSDNode>(User->getOperand(1))->getReg(); |
| 106 | if (TargetRegisterInfo::isVirtualRegister(Reg)) |
| 107 | return; |
| 108 | |
| 109 | unsigned ResNo = User->getOperand(2).getResNo(); |
| 110 | if (Def->isMachineOpcode()) { |
| 111 | const TargetInstrDesc &II = TII->get(Def->getMachineOpcode()); |
| 112 | if (ResNo >= II.getNumDefs() && |
Evan Cheng | c29a56d | 2009-01-12 03:19:55 +0000 | [diff] [blame] | 113 | II.ImplicitDefs[ResNo - II.getNumDefs()] == Reg) { |
Dan Gohman | 343f0c0 | 2008-11-19 23:18:57 +0000 | [diff] [blame] | 114 | PhysReg = Reg; |
Evan Cheng | c29a56d | 2009-01-12 03:19:55 +0000 | [diff] [blame] | 115 | const TargetRegisterClass *RC = |
Rafael Espindola | d31f972 | 2010-06-29 14:02:34 +0000 | [diff] [blame] | 116 | TRI->getMinimalPhysRegClass(Reg, Def->getValueType(ResNo)); |
Evan Cheng | c29a56d | 2009-01-12 03:19:55 +0000 | [diff] [blame] | 117 | Cost = RC->getCopyCost(); |
| 118 | } |
Dan Gohman | 343f0c0 | 2008-11-19 23:18:57 +0000 | [diff] [blame] | 119 | } |
| 120 | } |
| 121 | |
Chris Lattner | 29d8f0c | 2010-12-23 17:24:32 +0000 | [diff] [blame] | 122 | static void AddGlue(SDNode *N, SDValue Glue, bool AddGlue, SelectionDAG *DAG) { |
Evan Cheng | c589e03 | 2010-01-22 03:36:51 +0000 | [diff] [blame] | 123 | SmallVector<EVT, 4> VTs; |
Chris Lattner | 29d8f0c | 2010-12-23 17:24:32 +0000 | [diff] [blame] | 124 | SDNode *GlueDestNode = Glue.getNode(); |
Bill Wendling | 151d26d | 2010-06-23 18:16:24 +0000 | [diff] [blame] | 125 | |
Chris Lattner | 29d8f0c | 2010-12-23 17:24:32 +0000 | [diff] [blame] | 126 | // Don't add glue from a node to itself. |
| 127 | if (GlueDestNode == N) return; |
Bill Wendling | 10707f3 | 2010-06-24 22:00:37 +0000 | [diff] [blame] | 128 | |
Chris Lattner | 29d8f0c | 2010-12-23 17:24:32 +0000 | [diff] [blame] | 129 | // Don't add glue to something which already has glue. |
Chris Lattner | f1b4eaf | 2010-12-21 02:38:05 +0000 | [diff] [blame] | 130 | if (N->getValueType(N->getNumValues() - 1) == MVT::Glue) return; |
Bill Wendling | 10707f3 | 2010-06-24 22:00:37 +0000 | [diff] [blame] | 131 | |
| 132 | for (unsigned I = 0, E = N->getNumValues(); I != E; ++I) |
| 133 | VTs.push_back(N->getValueType(I)); |
Bill Wendling | 151d26d | 2010-06-23 18:16:24 +0000 | [diff] [blame] | 134 | |
Chris Lattner | 29d8f0c | 2010-12-23 17:24:32 +0000 | [diff] [blame] | 135 | if (AddGlue) |
Chris Lattner | f1b4eaf | 2010-12-21 02:38:05 +0000 | [diff] [blame] | 136 | VTs.push_back(MVT::Glue); |
Bill Wendling | 151d26d | 2010-06-23 18:16:24 +0000 | [diff] [blame] | 137 | |
Evan Cheng | c589e03 | 2010-01-22 03:36:51 +0000 | [diff] [blame] | 138 | SmallVector<SDValue, 4> Ops; |
Bill Wendling | 10707f3 | 2010-06-24 22:00:37 +0000 | [diff] [blame] | 139 | for (unsigned I = 0, E = N->getNumOperands(); I != E; ++I) |
| 140 | Ops.push_back(N->getOperand(I)); |
Bill Wendling | 151d26d | 2010-06-23 18:16:24 +0000 | [diff] [blame] | 141 | |
Chris Lattner | 29d8f0c | 2010-12-23 17:24:32 +0000 | [diff] [blame] | 142 | if (GlueDestNode) |
| 143 | Ops.push_back(Glue); |
Bill Wendling | 151d26d | 2010-06-23 18:16:24 +0000 | [diff] [blame] | 144 | |
Evan Cheng | c589e03 | 2010-01-22 03:36:51 +0000 | [diff] [blame] | 145 | SDVTList VTList = DAG->getVTList(&VTs[0], VTs.size()); |
Bill Wendling | 151d26d | 2010-06-23 18:16:24 +0000 | [diff] [blame] | 146 | MachineSDNode::mmo_iterator Begin = 0, End = 0; |
| 147 | MachineSDNode *MN = dyn_cast<MachineSDNode>(N); |
| 148 | |
| 149 | // Store memory references. |
| 150 | if (MN) { |
| 151 | Begin = MN->memoperands_begin(); |
| 152 | End = MN->memoperands_end(); |
| 153 | } |
| 154 | |
Evan Cheng | c589e03 | 2010-01-22 03:36:51 +0000 | [diff] [blame] | 155 | DAG->MorphNodeTo(N, N->getOpcode(), VTList, &Ops[0], Ops.size()); |
Bill Wendling | 151d26d | 2010-06-23 18:16:24 +0000 | [diff] [blame] | 156 | |
| 157 | // Reset the memory references |
| 158 | if (MN) |
| 159 | MN->setMemRefs(Begin, End); |
Evan Cheng | c589e03 | 2010-01-22 03:36:51 +0000 | [diff] [blame] | 160 | } |
| 161 | |
Chris Lattner | 29d8f0c | 2010-12-23 17:24:32 +0000 | [diff] [blame] | 162 | /// ClusterNeighboringLoads - Force nearby loads together by "gluing" them. |
Evan Cheng | c589e03 | 2010-01-22 03:36:51 +0000 | [diff] [blame] | 163 | /// This function finds loads of the same base and different offsets. If the |
Chris Lattner | f1b4eaf | 2010-12-21 02:38:05 +0000 | [diff] [blame] | 164 | /// offsets are not far apart (target specific), it add MVT::Glue inputs and |
Evan Cheng | c589e03 | 2010-01-22 03:36:51 +0000 | [diff] [blame] | 165 | /// outputs to ensure they are scheduled together and in order. This |
| 166 | /// optimization may benefit some targets by improving cache locality. |
Evan Cheng | 302ef83 | 2010-06-10 02:09:31 +0000 | [diff] [blame] | 167 | void ScheduleDAGSDNodes::ClusterNeighboringLoads(SDNode *Node) { |
| 168 | SDNode *Chain = 0; |
| 169 | unsigned NumOps = Node->getNumOperands(); |
| 170 | if (Node->getOperand(NumOps-1).getValueType() == MVT::Other) |
| 171 | Chain = Node->getOperand(NumOps-1).getNode(); |
| 172 | if (!Chain) |
| 173 | return; |
| 174 | |
| 175 | // Look for other loads of the same chain. Find loads that are loading from |
| 176 | // the same base pointer and different offsets. |
Evan Cheng | c589e03 | 2010-01-22 03:36:51 +0000 | [diff] [blame] | 177 | SmallPtrSet<SDNode*, 16> Visited; |
| 178 | SmallVector<int64_t, 4> Offsets; |
| 179 | DenseMap<long long, SDNode*> O2SMap; // Map from offset to SDNode. |
Evan Cheng | 302ef83 | 2010-06-10 02:09:31 +0000 | [diff] [blame] | 180 | bool Cluster = false; |
| 181 | SDNode *Base = Node; |
Evan Cheng | 302ef83 | 2010-06-10 02:09:31 +0000 | [diff] [blame] | 182 | for (SDNode::use_iterator I = Chain->use_begin(), E = Chain->use_end(); |
| 183 | I != E; ++I) { |
| 184 | SDNode *User = *I; |
| 185 | if (User == Node || !Visited.insert(User)) |
| 186 | continue; |
| 187 | int64_t Offset1, Offset2; |
| 188 | if (!TII->areLoadsFromSameBasePtr(Base, User, Offset1, Offset2) || |
| 189 | Offset1 == Offset2) |
| 190 | // FIXME: Should be ok if they addresses are identical. But earlier |
| 191 | // optimizations really should have eliminated one of the loads. |
| 192 | continue; |
| 193 | if (O2SMap.insert(std::make_pair(Offset1, Base)).second) |
| 194 | Offsets.push_back(Offset1); |
| 195 | O2SMap.insert(std::make_pair(Offset2, User)); |
| 196 | Offsets.push_back(Offset2); |
Duncan Sands | b447c4e | 2010-06-25 14:48:39 +0000 | [diff] [blame] | 197 | if (Offset2 < Offset1) |
Evan Cheng | 302ef83 | 2010-06-10 02:09:31 +0000 | [diff] [blame] | 198 | Base = User; |
Evan Cheng | 302ef83 | 2010-06-10 02:09:31 +0000 | [diff] [blame] | 199 | Cluster = true; |
| 200 | } |
| 201 | |
| 202 | if (!Cluster) |
| 203 | return; |
| 204 | |
| 205 | // Sort them in increasing order. |
| 206 | std::sort(Offsets.begin(), Offsets.end()); |
| 207 | |
| 208 | // Check if the loads are close enough. |
| 209 | SmallVector<SDNode*, 4> Loads; |
| 210 | unsigned NumLoads = 0; |
| 211 | int64_t BaseOff = Offsets[0]; |
| 212 | SDNode *BaseLoad = O2SMap[BaseOff]; |
| 213 | Loads.push_back(BaseLoad); |
| 214 | for (unsigned i = 1, e = Offsets.size(); i != e; ++i) { |
| 215 | int64_t Offset = Offsets[i]; |
| 216 | SDNode *Load = O2SMap[Offset]; |
| 217 | if (!TII->shouldScheduleLoadsNear(BaseLoad, Load, BaseOff, Offset,NumLoads)) |
| 218 | break; // Stop right here. Ignore loads that are further away. |
| 219 | Loads.push_back(Load); |
| 220 | ++NumLoads; |
| 221 | } |
| 222 | |
| 223 | if (NumLoads == 0) |
| 224 | return; |
| 225 | |
Chris Lattner | f1b4eaf | 2010-12-21 02:38:05 +0000 | [diff] [blame] | 226 | // Cluster loads by adding MVT::Glue outputs and inputs. This also |
Evan Cheng | 302ef83 | 2010-06-10 02:09:31 +0000 | [diff] [blame] | 227 | // ensure they are scheduled in order of increasing addresses. |
| 228 | SDNode *Lead = Loads[0]; |
Chris Lattner | 29d8f0c | 2010-12-23 17:24:32 +0000 | [diff] [blame] | 229 | AddGlue(Lead, SDValue(0, 0), true, DAG); |
Bill Wendling | 151d26d | 2010-06-23 18:16:24 +0000 | [diff] [blame] | 230 | |
Chris Lattner | 29d8f0c | 2010-12-23 17:24:32 +0000 | [diff] [blame] | 231 | SDValue InGlue = SDValue(Lead, Lead->getNumValues() - 1); |
Bill Wendling | 10707f3 | 2010-06-24 22:00:37 +0000 | [diff] [blame] | 232 | for (unsigned I = 1, E = Loads.size(); I != E; ++I) { |
Chris Lattner | 29d8f0c | 2010-12-23 17:24:32 +0000 | [diff] [blame] | 233 | bool OutGlue = I < E - 1; |
Bill Wendling | 10707f3 | 2010-06-24 22:00:37 +0000 | [diff] [blame] | 234 | SDNode *Load = Loads[I]; |
| 235 | |
Chris Lattner | 29d8f0c | 2010-12-23 17:24:32 +0000 | [diff] [blame] | 236 | AddGlue(Load, InGlue, OutGlue, DAG); |
Bill Wendling | 151d26d | 2010-06-23 18:16:24 +0000 | [diff] [blame] | 237 | |
Chris Lattner | 29d8f0c | 2010-12-23 17:24:32 +0000 | [diff] [blame] | 238 | if (OutGlue) |
| 239 | InGlue = SDValue(Load, Load->getNumValues() - 1); |
Bill Wendling | 151d26d | 2010-06-23 18:16:24 +0000 | [diff] [blame] | 240 | |
Evan Cheng | 302ef83 | 2010-06-10 02:09:31 +0000 | [diff] [blame] | 241 | ++LoadsClustered; |
| 242 | } |
| 243 | } |
| 244 | |
| 245 | /// ClusterNodes - Cluster certain nodes which should be scheduled together. |
| 246 | /// |
| 247 | void ScheduleDAGSDNodes::ClusterNodes() { |
Evan Cheng | c589e03 | 2010-01-22 03:36:51 +0000 | [diff] [blame] | 248 | for (SelectionDAG::allnodes_iterator NI = DAG->allnodes_begin(), |
| 249 | E = DAG->allnodes_end(); NI != E; ++NI) { |
| 250 | SDNode *Node = &*NI; |
| 251 | if (!Node || !Node->isMachineOpcode()) |
| 252 | continue; |
| 253 | |
| 254 | unsigned Opc = Node->getMachineOpcode(); |
| 255 | const TargetInstrDesc &TID = TII->get(Opc); |
Evan Cheng | 302ef83 | 2010-06-10 02:09:31 +0000 | [diff] [blame] | 256 | if (TID.mayLoad()) |
| 257 | // Cluster loads from "near" addresses into combined SUnits. |
| 258 | ClusterNeighboringLoads(Node); |
Evan Cheng | c589e03 | 2010-01-22 03:36:51 +0000 | [diff] [blame] | 259 | } |
| 260 | } |
| 261 | |
Dan Gohman | 343f0c0 | 2008-11-19 23:18:57 +0000 | [diff] [blame] | 262 | void ScheduleDAGSDNodes::BuildSchedUnits() { |
Dan Gohman | e1dfc7d | 2008-12-23 17:24:50 +0000 | [diff] [blame] | 263 | // During scheduling, the NodeId field of SDNode is used to map SDNodes |
| 264 | // to their associated SUnits by holding SUnits table indices. A value |
| 265 | // of -1 means the SDNode does not yet have an associated SUnit. |
| 266 | unsigned NumNodes = 0; |
| 267 | for (SelectionDAG::allnodes_iterator NI = DAG->allnodes_begin(), |
| 268 | E = DAG->allnodes_end(); NI != E; ++NI) { |
| 269 | NI->setNodeId(-1); |
| 270 | ++NumNodes; |
| 271 | } |
| 272 | |
Dan Gohman | 343f0c0 | 2008-11-19 23:18:57 +0000 | [diff] [blame] | 273 | // Reserve entries in the vector for each of the SUnits we are creating. This |
| 274 | // ensure that reallocation of the vector won't happen, so SUnit*'s won't get |
| 275 | // invalidated. |
Dan Gohman | 89b64bd | 2008-12-17 04:30:46 +0000 | [diff] [blame] | 276 | // FIXME: Multiply by 2 because we may clone nodes during scheduling. |
| 277 | // This is a temporary workaround. |
Dan Gohman | e1dfc7d | 2008-12-23 17:24:50 +0000 | [diff] [blame] | 278 | SUnits.reserve(NumNodes * 2); |
Andrew Trick | cd5af07 | 2011-02-03 23:00:17 +0000 | [diff] [blame] | 279 | |
Chris Lattner | 736a6ea | 2010-02-24 06:11:37 +0000 | [diff] [blame] | 280 | // Add all nodes in depth first order. |
| 281 | SmallVector<SDNode*, 64> Worklist; |
| 282 | SmallPtrSet<SDNode*, 64> Visited; |
| 283 | Worklist.push_back(DAG->getRoot().getNode()); |
| 284 | Visited.insert(DAG->getRoot().getNode()); |
Andrew Trick | cd5af07 | 2011-02-03 23:00:17 +0000 | [diff] [blame] | 285 | |
Chris Lattner | 736a6ea | 2010-02-24 06:11:37 +0000 | [diff] [blame] | 286 | while (!Worklist.empty()) { |
| 287 | SDNode *NI = Worklist.pop_back_val(); |
Andrew Trick | cd5af07 | 2011-02-03 23:00:17 +0000 | [diff] [blame] | 288 | |
Chris Lattner | 736a6ea | 2010-02-24 06:11:37 +0000 | [diff] [blame] | 289 | // Add all operands to the worklist unless they've already been added. |
| 290 | for (unsigned i = 0, e = NI->getNumOperands(); i != e; ++i) |
| 291 | if (Visited.insert(NI->getOperand(i).getNode())) |
| 292 | Worklist.push_back(NI->getOperand(i).getNode()); |
Andrew Trick | cd5af07 | 2011-02-03 23:00:17 +0000 | [diff] [blame] | 293 | |
Dan Gohman | 343f0c0 | 2008-11-19 23:18:57 +0000 | [diff] [blame] | 294 | if (isPassiveNode(NI)) // Leaf node, e.g. a TargetImmediate. |
| 295 | continue; |
Andrew Trick | cd5af07 | 2011-02-03 23:00:17 +0000 | [diff] [blame] | 296 | |
Dan Gohman | 343f0c0 | 2008-11-19 23:18:57 +0000 | [diff] [blame] | 297 | // If this node has already been processed, stop now. |
| 298 | if (NI->getNodeId() != -1) continue; |
Andrew Trick | cd5af07 | 2011-02-03 23:00:17 +0000 | [diff] [blame] | 299 | |
Dan Gohman | 343f0c0 | 2008-11-19 23:18:57 +0000 | [diff] [blame] | 300 | SUnit *NodeSUnit = NewSUnit(NI); |
Andrew Trick | cd5af07 | 2011-02-03 23:00:17 +0000 | [diff] [blame] | 301 | |
Chris Lattner | 29d8f0c | 2010-12-23 17:24:32 +0000 | [diff] [blame] | 302 | // See if anything is glued to this node, if so, add them to glued |
| 303 | // nodes. Nodes can have at most one glue input and one glue output. Glue |
| 304 | // is required to be the last operand and result of a node. |
Andrew Trick | cd5af07 | 2011-02-03 23:00:17 +0000 | [diff] [blame] | 305 | |
Chris Lattner | 29d8f0c | 2010-12-23 17:24:32 +0000 | [diff] [blame] | 306 | // Scan up to find glued preds. |
Dan Gohman | 343f0c0 | 2008-11-19 23:18:57 +0000 | [diff] [blame] | 307 | SDNode *N = NI; |
Dan Gohman | db95fa1 | 2009-03-20 20:42:23 +0000 | [diff] [blame] | 308 | while (N->getNumOperands() && |
Chris Lattner | f1b4eaf | 2010-12-21 02:38:05 +0000 | [diff] [blame] | 309 | N->getOperand(N->getNumOperands()-1).getValueType() == MVT::Glue) { |
Dan Gohman | db95fa1 | 2009-03-20 20:42:23 +0000 | [diff] [blame] | 310 | N = N->getOperand(N->getNumOperands()-1).getNode(); |
| 311 | assert(N->getNodeId() == -1 && "Node already inserted!"); |
| 312 | N->setNodeId(NodeSUnit->NodeNum); |
Evan Cheng | 8239daf | 2010-11-03 00:45:17 +0000 | [diff] [blame] | 313 | if (N->isMachineOpcode() && TII->get(N->getMachineOpcode()).isCall()) |
| 314 | NodeSUnit->isCall = true; |
Dan Gohman | 343f0c0 | 2008-11-19 23:18:57 +0000 | [diff] [blame] | 315 | } |
Andrew Trick | cd5af07 | 2011-02-03 23:00:17 +0000 | [diff] [blame] | 316 | |
Chris Lattner | 29d8f0c | 2010-12-23 17:24:32 +0000 | [diff] [blame] | 317 | // Scan down to find any glued succs. |
Dan Gohman | 343f0c0 | 2008-11-19 23:18:57 +0000 | [diff] [blame] | 318 | N = NI; |
Chris Lattner | f1b4eaf | 2010-12-21 02:38:05 +0000 | [diff] [blame] | 319 | while (N->getValueType(N->getNumValues()-1) == MVT::Glue) { |
Chris Lattner | 29d8f0c | 2010-12-23 17:24:32 +0000 | [diff] [blame] | 320 | SDValue GlueVal(N, N->getNumValues()-1); |
Andrew Trick | cd5af07 | 2011-02-03 23:00:17 +0000 | [diff] [blame] | 321 | |
Chris Lattner | 29d8f0c | 2010-12-23 17:24:32 +0000 | [diff] [blame] | 322 | // There are either zero or one users of the Glue result. |
| 323 | bool HasGlueUse = false; |
Andrew Trick | cd5af07 | 2011-02-03 23:00:17 +0000 | [diff] [blame] | 324 | for (SDNode::use_iterator UI = N->use_begin(), E = N->use_end(); |
Dan Gohman | 343f0c0 | 2008-11-19 23:18:57 +0000 | [diff] [blame] | 325 | UI != E; ++UI) |
Chris Lattner | 29d8f0c | 2010-12-23 17:24:32 +0000 | [diff] [blame] | 326 | if (GlueVal.isOperandOf(*UI)) { |
| 327 | HasGlueUse = true; |
Dan Gohman | 343f0c0 | 2008-11-19 23:18:57 +0000 | [diff] [blame] | 328 | assert(N->getNodeId() == -1 && "Node already inserted!"); |
| 329 | N->setNodeId(NodeSUnit->NodeNum); |
| 330 | N = *UI; |
Evan Cheng | 8239daf | 2010-11-03 00:45:17 +0000 | [diff] [blame] | 331 | if (N->isMachineOpcode() && TII->get(N->getMachineOpcode()).isCall()) |
| 332 | NodeSUnit->isCall = true; |
Dan Gohman | 343f0c0 | 2008-11-19 23:18:57 +0000 | [diff] [blame] | 333 | break; |
| 334 | } |
Chris Lattner | 29d8f0c | 2010-12-23 17:24:32 +0000 | [diff] [blame] | 335 | if (!HasGlueUse) break; |
Dan Gohman | 343f0c0 | 2008-11-19 23:18:57 +0000 | [diff] [blame] | 336 | } |
Andrew Trick | cd5af07 | 2011-02-03 23:00:17 +0000 | [diff] [blame] | 337 | |
Chris Lattner | 29d8f0c | 2010-12-23 17:24:32 +0000 | [diff] [blame] | 338 | // If there are glue operands involved, N is now the bottom-most node |
| 339 | // of the sequence of nodes that are glued together. |
Dan Gohman | 343f0c0 | 2008-11-19 23:18:57 +0000 | [diff] [blame] | 340 | // Update the SUnit. |
| 341 | NodeSUnit->setNode(N); |
| 342 | assert(N->getNodeId() == -1 && "Node already inserted!"); |
| 343 | N->setNodeId(NodeSUnit->NodeNum); |
| 344 | |
Andrew Trick | c558bf3 | 2011-04-12 20:14:07 +0000 | [diff] [blame^] | 345 | // Set isVRegCycle if the node operands are live into and value is live out |
| 346 | // of a single block loop. |
| 347 | InitVRegCycleFlag(NodeSUnit); |
| 348 | |
Andrew Trick | 92e9466 | 2011-02-04 03:18:17 +0000 | [diff] [blame] | 349 | // Compute NumRegDefsLeft. This must be done before AddSchedEdges. |
| 350 | InitNumRegDefsLeft(NodeSUnit); |
| 351 | |
Dan Gohman | 787782f | 2008-11-21 01:44:51 +0000 | [diff] [blame] | 352 | // Assign the Latency field of NodeSUnit using target-provided information. |
Evan Cheng | e163168 | 2010-05-19 22:42:23 +0000 | [diff] [blame] | 353 | ComputeLatency(NodeSUnit); |
Dan Gohman | 343f0c0 | 2008-11-19 23:18:57 +0000 | [diff] [blame] | 354 | } |
Dan Gohman | c9a5b9e | 2008-12-23 18:36:58 +0000 | [diff] [blame] | 355 | } |
| 356 | |
| 357 | void ScheduleDAGSDNodes::AddSchedEdges() { |
David Goodwin | 7104616 | 2009-08-13 16:05:04 +0000 | [diff] [blame] | 358 | const TargetSubtarget &ST = TM.getSubtarget<TargetSubtarget>(); |
| 359 | |
David Goodwin | dc4bdcd | 2009-08-19 16:08:58 +0000 | [diff] [blame] | 360 | // Check to see if the scheduler cares about latencies. |
| 361 | bool UnitLatencies = ForceUnitLatencies(); |
| 362 | |
Dan Gohman | 343f0c0 | 2008-11-19 23:18:57 +0000 | [diff] [blame] | 363 | // Pass 2: add the preds, succs, etc. |
| 364 | for (unsigned su = 0, e = SUnits.size(); su != e; ++su) { |
| 365 | SUnit *SU = &SUnits[su]; |
| 366 | SDNode *MainNode = SU->getNode(); |
Andrew Trick | cd5af07 | 2011-02-03 23:00:17 +0000 | [diff] [blame] | 367 | |
Dan Gohman | 343f0c0 | 2008-11-19 23:18:57 +0000 | [diff] [blame] | 368 | if (MainNode->isMachineOpcode()) { |
| 369 | unsigned Opc = MainNode->getMachineOpcode(); |
| 370 | const TargetInstrDesc &TID = TII->get(Opc); |
| 371 | for (unsigned i = 0; i != TID.getNumOperands(); ++i) { |
| 372 | if (TID.getOperandConstraint(i, TOI::TIED_TO) != -1) { |
| 373 | SU->isTwoAddress = true; |
| 374 | break; |
| 375 | } |
| 376 | } |
| 377 | if (TID.isCommutable()) |
| 378 | SU->isCommutable = true; |
| 379 | } |
Andrew Trick | cd5af07 | 2011-02-03 23:00:17 +0000 | [diff] [blame] | 380 | |
Dan Gohman | 343f0c0 | 2008-11-19 23:18:57 +0000 | [diff] [blame] | 381 | // Find all predecessors and successors of the group. |
Chris Lattner | 29d8f0c | 2010-12-23 17:24:32 +0000 | [diff] [blame] | 382 | for (SDNode *N = SU->getNode(); N; N = N->getGluedNode()) { |
Dan Gohman | 343f0c0 | 2008-11-19 23:18:57 +0000 | [diff] [blame] | 383 | if (N->isMachineOpcode() && |
Dan Gohman | 3974667 | 2009-03-23 16:10:52 +0000 | [diff] [blame] | 384 | TII->get(N->getMachineOpcode()).getImplicitDefs()) { |
| 385 | SU->hasPhysRegClobbers = true; |
Dan Gohman | bcea859 | 2009-10-10 01:32:21 +0000 | [diff] [blame] | 386 | unsigned NumUsed = InstrEmitter::CountResults(N); |
Dan Gohman | 8cccf0e | 2009-03-23 17:39:36 +0000 | [diff] [blame] | 387 | while (NumUsed != 0 && !N->hasAnyUseOfValue(NumUsed - 1)) |
| 388 | --NumUsed; // Skip over unused values at the end. |
| 389 | if (NumUsed > TII->get(N->getMachineOpcode()).getNumDefs()) |
Dan Gohman | 3974667 | 2009-03-23 16:10:52 +0000 | [diff] [blame] | 390 | SU->hasPhysRegDefs = true; |
| 391 | } |
Andrew Trick | cd5af07 | 2011-02-03 23:00:17 +0000 | [diff] [blame] | 392 | |
Dan Gohman | 343f0c0 | 2008-11-19 23:18:57 +0000 | [diff] [blame] | 393 | for (unsigned i = 0, e = N->getNumOperands(); i != e; ++i) { |
| 394 | SDNode *OpN = N->getOperand(i).getNode(); |
| 395 | if (isPassiveNode(OpN)) continue; // Not scheduled. |
| 396 | SUnit *OpSU = &SUnits[OpN->getNodeId()]; |
| 397 | assert(OpSU && "Node has no SUnit!"); |
| 398 | if (OpSU == SU) continue; // In the same group. |
| 399 | |
Owen Anderson | e50ed30 | 2009-08-10 22:56:29 +0000 | [diff] [blame] | 400 | EVT OpVT = N->getOperand(i).getValueType(); |
Chris Lattner | 29d8f0c | 2010-12-23 17:24:32 +0000 | [diff] [blame] | 401 | assert(OpVT != MVT::Glue && "Glued nodes should be in same sunit!"); |
Owen Anderson | 825b72b | 2009-08-11 20:47:22 +0000 | [diff] [blame] | 402 | bool isChain = OpVT == MVT::Other; |
Dan Gohman | 343f0c0 | 2008-11-19 23:18:57 +0000 | [diff] [blame] | 403 | |
| 404 | unsigned PhysReg = 0; |
Evan Cheng | c29a56d | 2009-01-12 03:19:55 +0000 | [diff] [blame] | 405 | int Cost = 1; |
Dan Gohman | 343f0c0 | 2008-11-19 23:18:57 +0000 | [diff] [blame] | 406 | // Determine if this is a physical register dependency. |
Evan Cheng | c29a56d | 2009-01-12 03:19:55 +0000 | [diff] [blame] | 407 | CheckForPhysRegDependency(OpN, N, i, TRI, TII, PhysReg, Cost); |
Dan Gohman | 54e4c36 | 2008-12-09 22:54:47 +0000 | [diff] [blame] | 408 | assert((PhysReg == 0 || !isChain) && |
| 409 | "Chain dependence via physreg data?"); |
Evan Cheng | c29a56d | 2009-01-12 03:19:55 +0000 | [diff] [blame] | 410 | // FIXME: See ScheduleDAGSDNodes::EmitCopyFromReg. For now, scheduler |
| 411 | // emits a copy from the physical register to a virtual register unless |
| 412 | // it requires a cross class copy (cost < 0). That means we are only |
| 413 | // treating "expensive to copy" register dependency as physical register |
| 414 | // dependency. This may change in the future though. |
| 415 | if (Cost >= 0) |
| 416 | PhysReg = 0; |
David Goodwin | 7104616 | 2009-08-13 16:05:04 +0000 | [diff] [blame] | 417 | |
Evan Cheng | 046fa3f | 2010-05-28 23:26:21 +0000 | [diff] [blame] | 418 | // If this is a ctrl dep, latency is 1. |
Andrew Trick | c558bf3 | 2011-04-12 20:14:07 +0000 | [diff] [blame^] | 419 | unsigned OpLatency = isChain ? 1 : OpSU->Latency; |
Evan Cheng | 046fa3f | 2010-05-28 23:26:21 +0000 | [diff] [blame] | 420 | const SDep &dep = SDep(OpSU, isChain ? SDep::Order : SDep::Data, |
| 421 | OpLatency, PhysReg); |
David Goodwin | dc4bdcd | 2009-08-19 16:08:58 +0000 | [diff] [blame] | 422 | if (!isChain && !UnitLatencies) { |
Evan Cheng | 15a16de | 2010-05-20 06:13:19 +0000 | [diff] [blame] | 423 | ComputeOperandLatency(OpN, N, i, const_cast<SDep &>(dep)); |
Dan Gohman | 3fb150a | 2010-04-17 17:42:52 +0000 | [diff] [blame] | 424 | ST.adjustSchedDependency(OpSU, SU, const_cast<SDep &>(dep)); |
David Goodwin | dc4bdcd | 2009-08-19 16:08:58 +0000 | [diff] [blame] | 425 | } |
David Goodwin | 7104616 | 2009-08-13 16:05:04 +0000 | [diff] [blame] | 426 | |
Andrew Trick | 4bbf467 | 2011-03-09 19:12:43 +0000 | [diff] [blame] | 427 | if (!SU->addPred(dep) && !dep.isCtrl() && OpSU->NumRegDefsLeft > 1) { |
Andrew Trick | 92e9466 | 2011-02-04 03:18:17 +0000 | [diff] [blame] | 428 | // Multiple register uses are combined in the same SUnit. For example, |
| 429 | // we could have a set of glued nodes with all their defs consumed by |
| 430 | // another set of glued nodes. Register pressure tracking sees this as |
| 431 | // a single use, so to keep pressure balanced we reduce the defs. |
Andrew Trick | 4bbf467 | 2011-03-09 19:12:43 +0000 | [diff] [blame] | 432 | // |
| 433 | // We can't tell (without more book-keeping) if this results from |
| 434 | // glued nodes or duplicate operands. As long as we don't reduce |
| 435 | // NumRegDefsLeft to zero, we handle the common cases well. |
Andrew Trick | 92e9466 | 2011-02-04 03:18:17 +0000 | [diff] [blame] | 436 | --OpSU->NumRegDefsLeft; |
| 437 | } |
Dan Gohman | 343f0c0 | 2008-11-19 23:18:57 +0000 | [diff] [blame] | 438 | } |
| 439 | } |
| 440 | } |
| 441 | } |
| 442 | |
Dan Gohman | c9a5b9e | 2008-12-23 18:36:58 +0000 | [diff] [blame] | 443 | /// BuildSchedGraph - Build the SUnit graph from the selection dag that we |
| 444 | /// are input. This SUnit graph is similar to the SelectionDAG, but |
| 445 | /// excludes nodes that aren't interesting to scheduling, and represents |
Chris Lattner | 29d8f0c | 2010-12-23 17:24:32 +0000 | [diff] [blame] | 446 | /// glued together nodes with a single SUnit. |
Dan Gohman | 98976e4 | 2009-10-09 23:33:48 +0000 | [diff] [blame] | 447 | void ScheduleDAGSDNodes::BuildSchedGraph(AliasAnalysis *AA) { |
Evan Cheng | 302ef83 | 2010-06-10 02:09:31 +0000 | [diff] [blame] | 448 | // Cluster certain nodes which should be scheduled together. |
| 449 | ClusterNodes(); |
Dan Gohman | c9a5b9e | 2008-12-23 18:36:58 +0000 | [diff] [blame] | 450 | // Populate the SUnits array. |
| 451 | BuildSchedUnits(); |
| 452 | // Compute all the scheduling dependencies between nodes. |
| 453 | AddSchedEdges(); |
| 454 | } |
| 455 | |
Andrew Trick | 92e9466 | 2011-02-04 03:18:17 +0000 | [diff] [blame] | 456 | // Initialize NumNodeDefs for the current Node's opcode. |
| 457 | void ScheduleDAGSDNodes::RegDefIter::InitNodeNumDefs() { |
Eric Christopher | 2944944 | 2011-03-08 19:35:47 +0000 | [diff] [blame] | 458 | // Check for phys reg copy. |
| 459 | if (!Node) |
| 460 | return; |
| 461 | |
Andrew Trick | 92e9466 | 2011-02-04 03:18:17 +0000 | [diff] [blame] | 462 | if (!Node->isMachineOpcode()) { |
| 463 | if (Node->getOpcode() == ISD::CopyFromReg) |
| 464 | NodeNumDefs = 1; |
| 465 | else |
| 466 | NodeNumDefs = 0; |
| 467 | return; |
| 468 | } |
| 469 | unsigned POpc = Node->getMachineOpcode(); |
| 470 | if (POpc == TargetOpcode::IMPLICIT_DEF) { |
| 471 | // No register need be allocated for this. |
| 472 | NodeNumDefs = 0; |
| 473 | return; |
| 474 | } |
| 475 | unsigned NRegDefs = SchedDAG->TII->get(Node->getMachineOpcode()).getNumDefs(); |
| 476 | // Some instructions define regs that are not represented in the selection DAG |
| 477 | // (e.g. unused flags). See tMOVi8. Make sure we don't access past NumValues. |
| 478 | NodeNumDefs = std::min(Node->getNumValues(), NRegDefs); |
| 479 | DefIdx = 0; |
| 480 | } |
| 481 | |
| 482 | // Construct a RegDefIter for this SUnit and find the first valid value. |
| 483 | ScheduleDAGSDNodes::RegDefIter::RegDefIter(const SUnit *SU, |
| 484 | const ScheduleDAGSDNodes *SD) |
| 485 | : SchedDAG(SD), Node(SU->getNode()), DefIdx(0), NodeNumDefs(0) { |
| 486 | InitNodeNumDefs(); |
| 487 | Advance(); |
| 488 | } |
| 489 | |
| 490 | // Advance to the next valid value defined by the SUnit. |
| 491 | void ScheduleDAGSDNodes::RegDefIter::Advance() { |
| 492 | for (;Node;) { // Visit all glued nodes. |
| 493 | for (;DefIdx < NodeNumDefs; ++DefIdx) { |
| 494 | if (!Node->hasAnyUseOfValue(DefIdx)) |
| 495 | continue; |
| 496 | if (Node->isMachineOpcode() && |
| 497 | Node->getMachineOpcode() == TargetOpcode::EXTRACT_SUBREG) { |
| 498 | // Propagate the incoming (full-register) type. I doubt it's needed. |
| 499 | ValueType = Node->getOperand(0).getValueType(); |
| 500 | } |
| 501 | else { |
| 502 | ValueType = Node->getValueType(DefIdx); |
| 503 | } |
| 504 | ++DefIdx; |
| 505 | return; // Found a normal regdef. |
| 506 | } |
| 507 | Node = Node->getGluedNode(); |
| 508 | if (Node == NULL) { |
| 509 | return; // No values left to visit. |
| 510 | } |
| 511 | InitNodeNumDefs(); |
| 512 | } |
| 513 | } |
| 514 | |
Andrew Trick | c558bf3 | 2011-04-12 20:14:07 +0000 | [diff] [blame^] | 515 | // Set isVRegCycle if this node's single use is CopyToReg and its only active |
| 516 | // data operands are CopyFromReg. |
| 517 | // |
| 518 | // This is only relevant for single-block loops, in which case the VRegCycle |
| 519 | // node is likely an induction variable in which the operand and target virtual |
| 520 | // registers should be coalesced (e.g. pre/post increment values). Setting the |
| 521 | // isVRegCycle flag helps the scheduler prioritize other uses of the same |
| 522 | // CopyFromReg so that this node becomes the virtual register "kill". This |
| 523 | // avoids interference between the values live in and out of the block and |
| 524 | // eliminates a copy inside the loop. |
| 525 | void ScheduleDAGSDNodes::InitVRegCycleFlag(SUnit *SU) { |
| 526 | if (!BB->isSuccessor(BB)) |
| 527 | return; |
| 528 | |
| 529 | SDNode *N = SU->getNode(); |
| 530 | if (N->getGluedNode()) |
| 531 | return; |
| 532 | |
| 533 | if (!N->hasOneUse() || N->use_begin()->getOpcode() != ISD::CopyToReg) |
| 534 | return; |
| 535 | |
| 536 | bool FoundLiveIn = false; |
| 537 | for (SDNode::op_iterator OI = N->op_begin(), E = N->op_end(); OI != E; ++OI) { |
| 538 | EVT OpVT = OI->getValueType(); |
| 539 | assert(OpVT != MVT::Glue && "Glued nodes should be in same sunit!"); |
| 540 | |
| 541 | if (OpVT == MVT::Other) |
| 542 | continue; // ignore chain operands |
| 543 | |
| 544 | if (isPassiveNode(OI->getNode())) |
| 545 | continue; // ignore constants and such |
| 546 | |
| 547 | if (OI->getNode()->getOpcode() != ISD::CopyFromReg) |
| 548 | return; |
| 549 | |
| 550 | FoundLiveIn = true; |
| 551 | } |
| 552 | if (FoundLiveIn) |
| 553 | SU->isVRegCycle = true; |
| 554 | } |
| 555 | |
Andrew Trick | 92e9466 | 2011-02-04 03:18:17 +0000 | [diff] [blame] | 556 | void ScheduleDAGSDNodes::InitNumRegDefsLeft(SUnit *SU) { |
| 557 | assert(SU->NumRegDefsLeft == 0 && "expect a new node"); |
| 558 | for (RegDefIter I(SU, this); I.IsValid(); I.Advance()) { |
| 559 | assert(SU->NumRegDefsLeft < USHRT_MAX && "overflow is ok but unexpected"); |
| 560 | ++SU->NumRegDefsLeft; |
| 561 | } |
| 562 | } |
| 563 | |
Dan Gohman | 343f0c0 | 2008-11-19 23:18:57 +0000 | [diff] [blame] | 564 | void ScheduleDAGSDNodes::ComputeLatency(SUnit *SU) { |
Evan Cheng | e163168 | 2010-05-19 22:42:23 +0000 | [diff] [blame] | 565 | // Check to see if the scheduler cares about latencies. |
| 566 | if (ForceUnitLatencies()) { |
| 567 | SU->Latency = 1; |
| 568 | return; |
| 569 | } |
| 570 | |
Evan Cheng | 3ef1c87 | 2010-09-10 01:29:16 +0000 | [diff] [blame] | 571 | if (!InstrItins || InstrItins->isEmpty()) { |
Andrew Trick | 5e84e3c | 2011-03-05 09:18:16 +0000 | [diff] [blame] | 572 | SDNode *N = SU->getNode(); |
| 573 | if (N && N->isMachineOpcode() && |
| 574 | TII->isHighLatencyDef(N->getMachineOpcode())) |
Andrew Trick | e0ef509 | 2011-03-05 08:00:22 +0000 | [diff] [blame] | 575 | SU->Latency = HighLatencyCycles; |
| 576 | else |
| 577 | SU->Latency = 1; |
Evan Cheng | 15a16de | 2010-05-20 06:13:19 +0000 | [diff] [blame] | 578 | return; |
| 579 | } |
Andrew Trick | cd5af07 | 2011-02-03 23:00:17 +0000 | [diff] [blame] | 580 | |
Dan Gohman | 343f0c0 | 2008-11-19 23:18:57 +0000 | [diff] [blame] | 581 | // Compute the latency for the node. We use the sum of the latencies for |
Chris Lattner | 29d8f0c | 2010-12-23 17:24:32 +0000 | [diff] [blame] | 582 | // all nodes glued together into this SUnit. |
Dan Gohman | 343f0c0 | 2008-11-19 23:18:57 +0000 | [diff] [blame] | 583 | SU->Latency = 0; |
Chris Lattner | 29d8f0c | 2010-12-23 17:24:32 +0000 | [diff] [blame] | 584 | for (SDNode *N = SU->getNode(); N; N = N->getGluedNode()) |
Evan Cheng | 8239daf | 2010-11-03 00:45:17 +0000 | [diff] [blame] | 585 | if (N->isMachineOpcode()) |
| 586 | SU->Latency += TII->getInstrLatency(InstrItins, N); |
Dan Gohman | 343f0c0 | 2008-11-19 23:18:57 +0000 | [diff] [blame] | 587 | } |
| 588 | |
Evan Cheng | 15a16de | 2010-05-20 06:13:19 +0000 | [diff] [blame] | 589 | void ScheduleDAGSDNodes::ComputeOperandLatency(SDNode *Def, SDNode *Use, |
| 590 | unsigned OpIdx, SDep& dep) const{ |
| 591 | // Check to see if the scheduler cares about latencies. |
| 592 | if (ForceUnitLatencies()) |
| 593 | return; |
| 594 | |
Evan Cheng | 15a16de | 2010-05-20 06:13:19 +0000 | [diff] [blame] | 595 | if (dep.getKind() != SDep::Data) |
| 596 | return; |
| 597 | |
| 598 | unsigned DefIdx = Use->getOperand(OpIdx).getResNo(); |
Evan Cheng | 7e2fe91 | 2010-10-28 06:47:08 +0000 | [diff] [blame] | 599 | if (Use->isMachineOpcode()) |
| 600 | // Adjust the use operand index by num of defs. |
| 601 | OpIdx += TII->get(Use->getMachineOpcode()).getNumDefs(); |
Evan Cheng | a0792de | 2010-10-06 06:27:31 +0000 | [diff] [blame] | 602 | int Latency = TII->getOperandLatency(InstrItins, Def, DefIdx, Use, OpIdx); |
Evan Cheng | 0897515 | 2010-10-29 18:09:28 +0000 | [diff] [blame] | 603 | if (Latency > 1 && Use->getOpcode() == ISD::CopyToReg && |
| 604 | !BB->succ_empty()) { |
| 605 | unsigned Reg = cast<RegisterSDNode>(Use->getOperand(1))->getReg(); |
| 606 | if (TargetRegisterInfo::isVirtualRegister(Reg)) |
| 607 | // This copy is a liveout value. It is likely coalesced, so reduce the |
| 608 | // latency so not to penalize the def. |
| 609 | // FIXME: need target specific adjustment here? |
| 610 | Latency = (Latency > 1) ? Latency - 1 : 1; |
| 611 | } |
Evan Cheng | 3881cb7 | 2010-09-29 22:42:35 +0000 | [diff] [blame] | 612 | if (Latency >= 0) |
| 613 | dep.setLatency(Latency); |
Evan Cheng | 15a16de | 2010-05-20 06:13:19 +0000 | [diff] [blame] | 614 | } |
| 615 | |
Dan Gohman | 343f0c0 | 2008-11-19 23:18:57 +0000 | [diff] [blame] | 616 | void ScheduleDAGSDNodes::dumpNode(const SUnit *SU) const { |
Evan Cheng | c29a56d | 2009-01-12 03:19:55 +0000 | [diff] [blame] | 617 | if (!SU->getNode()) { |
David Greene | 84fa822 | 2010-01-05 01:25:11 +0000 | [diff] [blame] | 618 | dbgs() << "PHYS REG COPY\n"; |
Evan Cheng | c29a56d | 2009-01-12 03:19:55 +0000 | [diff] [blame] | 619 | return; |
| 620 | } |
| 621 | |
| 622 | SU->getNode()->dump(DAG); |
David Greene | 84fa822 | 2010-01-05 01:25:11 +0000 | [diff] [blame] | 623 | dbgs() << "\n"; |
Chris Lattner | 29d8f0c | 2010-12-23 17:24:32 +0000 | [diff] [blame] | 624 | SmallVector<SDNode *, 4> GluedNodes; |
| 625 | for (SDNode *N = SU->getNode()->getGluedNode(); N; N = N->getGluedNode()) |
| 626 | GluedNodes.push_back(N); |
| 627 | while (!GluedNodes.empty()) { |
David Greene | 84fa822 | 2010-01-05 01:25:11 +0000 | [diff] [blame] | 628 | dbgs() << " "; |
Chris Lattner | 29d8f0c | 2010-12-23 17:24:32 +0000 | [diff] [blame] | 629 | GluedNodes.back()->dump(DAG); |
David Greene | 84fa822 | 2010-01-05 01:25:11 +0000 | [diff] [blame] | 630 | dbgs() << "\n"; |
Chris Lattner | 29d8f0c | 2010-12-23 17:24:32 +0000 | [diff] [blame] | 631 | GluedNodes.pop_back(); |
Dan Gohman | 343f0c0 | 2008-11-19 23:18:57 +0000 | [diff] [blame] | 632 | } |
| 633 | } |
Dan Gohman | bcea859 | 2009-10-10 01:32:21 +0000 | [diff] [blame] | 634 | |
Evan Cheng | bfcb305 | 2010-03-25 01:38:16 +0000 | [diff] [blame] | 635 | namespace { |
| 636 | struct OrderSorter { |
| 637 | bool operator()(const std::pair<unsigned, MachineInstr*> &A, |
| 638 | const std::pair<unsigned, MachineInstr*> &B) { |
| 639 | return A.first < B.first; |
| 640 | } |
| 641 | }; |
| 642 | } |
| 643 | |
Devang Patel | 55d20e8 | 2011-01-26 18:20:04 +0000 | [diff] [blame] | 644 | /// ProcessSDDbgValues - Process SDDbgValues assoicated with this node. |
Andrew Trick | cd5af07 | 2011-02-03 23:00:17 +0000 | [diff] [blame] | 645 | static void ProcessSDDbgValues(SDNode *N, SelectionDAG *DAG, |
Devang Patel | 55d20e8 | 2011-01-26 18:20:04 +0000 | [diff] [blame] | 646 | InstrEmitter &Emitter, |
| 647 | SmallVector<std::pair<unsigned, MachineInstr*>, 32> &Orders, |
| 648 | DenseMap<SDValue, unsigned> &VRBaseMap, |
| 649 | unsigned Order) { |
| 650 | if (!N->getHasDebugValue()) |
| 651 | return; |
| 652 | |
| 653 | // Opportunistically insert immediate dbg_value uses, i.e. those with source |
| 654 | // order number right after the N. |
| 655 | MachineBasicBlock *BB = Emitter.getBlock(); |
| 656 | MachineBasicBlock::iterator InsertPos = Emitter.getInsertPos(); |
| 657 | SmallVector<SDDbgValue*,2> &DVs = DAG->GetDbgValues(N); |
| 658 | for (unsigned i = 0, e = DVs.size(); i != e; ++i) { |
| 659 | if (DVs[i]->isInvalidated()) |
| 660 | continue; |
| 661 | unsigned DVOrder = DVs[i]->getOrder(); |
| 662 | if (!Order || DVOrder == ++Order) { |
| 663 | MachineInstr *DbgMI = Emitter.EmitDbgValue(DVs[i], VRBaseMap); |
| 664 | if (DbgMI) { |
| 665 | Orders.push_back(std::make_pair(DVOrder, DbgMI)); |
| 666 | BB->insert(InsertPos, DbgMI); |
| 667 | } |
| 668 | DVs[i]->setIsInvalidated(); |
| 669 | } |
| 670 | } |
| 671 | } |
| 672 | |
Evan Cheng | bfcb305 | 2010-03-25 01:38:16 +0000 | [diff] [blame] | 673 | // ProcessSourceNode - Process nodes with source order numbers. These are added |
Jim Grosbach | d27946d | 2010-06-30 21:27:56 +0000 | [diff] [blame] | 674 | // to a vector which EmitSchedule uses to determine how to insert dbg_value |
Evan Cheng | bfcb305 | 2010-03-25 01:38:16 +0000 | [diff] [blame] | 675 | // instructions in the right order. |
| 676 | static void ProcessSourceNode(SDNode *N, SelectionDAG *DAG, |
| 677 | InstrEmitter &Emitter, |
Evan Cheng | bfcb305 | 2010-03-25 01:38:16 +0000 | [diff] [blame] | 678 | DenseMap<SDValue, unsigned> &VRBaseMap, |
| 679 | SmallVector<std::pair<unsigned, MachineInstr*>, 32> &Orders, |
| 680 | SmallSet<unsigned, 8> &Seen) { |
| 681 | unsigned Order = DAG->GetOrdering(N); |
Devang Patel | 39078a8 | 2011-01-27 00:13:27 +0000 | [diff] [blame] | 682 | if (!Order || !Seen.insert(Order)) { |
| 683 | // Process any valid SDDbgValues even if node does not have any order |
| 684 | // assigned. |
| 685 | ProcessSDDbgValues(N, DAG, Emitter, Orders, VRBaseMap, 0); |
Evan Cheng | bfcb305 | 2010-03-25 01:38:16 +0000 | [diff] [blame] | 686 | return; |
Devang Patel | 39078a8 | 2011-01-27 00:13:27 +0000 | [diff] [blame] | 687 | } |
Evan Cheng | bfcb305 | 2010-03-25 01:38:16 +0000 | [diff] [blame] | 688 | |
| 689 | MachineBasicBlock *BB = Emitter.getBlock(); |
Dan Gohman | 84023e0 | 2010-07-10 09:00:22 +0000 | [diff] [blame] | 690 | if (Emitter.getInsertPos() == BB->begin() || BB->back().isPHI()) { |
Evan Cheng | bfcb305 | 2010-03-25 01:38:16 +0000 | [diff] [blame] | 691 | // Did not insert any instruction. |
| 692 | Orders.push_back(std::make_pair(Order, (MachineInstr*)0)); |
| 693 | return; |
| 694 | } |
| 695 | |
Dan Gohman | 84023e0 | 2010-07-10 09:00:22 +0000 | [diff] [blame] | 696 | Orders.push_back(std::make_pair(Order, prior(Emitter.getInsertPos()))); |
Devang Patel | 55d20e8 | 2011-01-26 18:20:04 +0000 | [diff] [blame] | 697 | ProcessSDDbgValues(N, DAG, Emitter, Orders, VRBaseMap, Order); |
Evan Cheng | bfcb305 | 2010-03-25 01:38:16 +0000 | [diff] [blame] | 698 | } |
| 699 | |
| 700 | |
Dan Gohman | bcea859 | 2009-10-10 01:32:21 +0000 | [diff] [blame] | 701 | /// EmitSchedule - Emit the machine code in scheduled order. |
Dan Gohman | af1d8ca | 2010-05-01 00:01:06 +0000 | [diff] [blame] | 702 | MachineBasicBlock *ScheduleDAGSDNodes::EmitSchedule() { |
Dan Gohman | bcea859 | 2009-10-10 01:32:21 +0000 | [diff] [blame] | 703 | InstrEmitter Emitter(BB, InsertPos); |
| 704 | DenseMap<SDValue, unsigned> VRBaseMap; |
| 705 | DenseMap<SUnit*, unsigned> CopyVRBaseMap; |
Evan Cheng | bfcb305 | 2010-03-25 01:38:16 +0000 | [diff] [blame] | 706 | SmallVector<std::pair<unsigned, MachineInstr*>, 32> Orders; |
| 707 | SmallSet<unsigned, 8> Seen; |
| 708 | bool HasDbg = DAG->hasDebugValues(); |
Dale Johannesen | bfdf7f3 | 2010-03-10 22:13:47 +0000 | [diff] [blame] | 709 | |
Dale Johannesen | fdb42fa | 2010-04-26 20:06:49 +0000 | [diff] [blame] | 710 | // If this is the first BB, emit byval parameter dbg_value's. |
| 711 | if (HasDbg && BB->getParent()->begin() == MachineFunction::iterator(BB)) { |
| 712 | SDDbgInfo::DbgIterator PDI = DAG->ByvalParmDbgBegin(); |
| 713 | SDDbgInfo::DbgIterator PDE = DAG->ByvalParmDbgEnd(); |
| 714 | for (; PDI != PDE; ++PDI) { |
Dan Gohman | 891ff8f | 2010-04-30 19:35:33 +0000 | [diff] [blame] | 715 | MachineInstr *DbgMI= Emitter.EmitDbgValue(*PDI, VRBaseMap); |
Dale Johannesen | fdb42fa | 2010-04-26 20:06:49 +0000 | [diff] [blame] | 716 | if (DbgMI) |
Dan Gohman | 84023e0 | 2010-07-10 09:00:22 +0000 | [diff] [blame] | 717 | BB->insert(InsertPos, DbgMI); |
Dale Johannesen | fdb42fa | 2010-04-26 20:06:49 +0000 | [diff] [blame] | 718 | } |
| 719 | } |
| 720 | |
Dan Gohman | bcea859 | 2009-10-10 01:32:21 +0000 | [diff] [blame] | 721 | for (unsigned i = 0, e = Sequence.size(); i != e; i++) { |
| 722 | SUnit *SU = Sequence[i]; |
| 723 | if (!SU) { |
| 724 | // Null SUnit* is a noop. |
| 725 | EmitNoop(); |
| 726 | continue; |
| 727 | } |
| 728 | |
| 729 | // For pre-regalloc scheduling, create instructions corresponding to the |
Chris Lattner | 29d8f0c | 2010-12-23 17:24:32 +0000 | [diff] [blame] | 730 | // SDNode and any glued SDNodes and append them to the block. |
Dan Gohman | bcea859 | 2009-10-10 01:32:21 +0000 | [diff] [blame] | 731 | if (!SU->getNode()) { |
| 732 | // Emit a copy. |
| 733 | EmitPhysRegCopy(SU, CopyVRBaseMap); |
| 734 | continue; |
| 735 | } |
| 736 | |
Chris Lattner | 29d8f0c | 2010-12-23 17:24:32 +0000 | [diff] [blame] | 737 | SmallVector<SDNode *, 4> GluedNodes; |
| 738 | for (SDNode *N = SU->getNode()->getGluedNode(); N; |
| 739 | N = N->getGluedNode()) |
| 740 | GluedNodes.push_back(N); |
| 741 | while (!GluedNodes.empty()) { |
| 742 | SDNode *N = GluedNodes.back(); |
| 743 | Emitter.EmitNode(GluedNodes.back(), SU->OrigNode != SU, SU->isCloned, |
Dan Gohman | af1d8ca | 2010-05-01 00:01:06 +0000 | [diff] [blame] | 744 | VRBaseMap); |
Dale Johannesen | fdb42fa | 2010-04-26 20:06:49 +0000 | [diff] [blame] | 745 | // Remember the source order of the inserted instruction. |
Evan Cheng | bfcb305 | 2010-03-25 01:38:16 +0000 | [diff] [blame] | 746 | if (HasDbg) |
Dan Gohman | 891ff8f | 2010-04-30 19:35:33 +0000 | [diff] [blame] | 747 | ProcessSourceNode(N, DAG, Emitter, VRBaseMap, Orders, Seen); |
Chris Lattner | 29d8f0c | 2010-12-23 17:24:32 +0000 | [diff] [blame] | 748 | GluedNodes.pop_back(); |
Dan Gohman | bcea859 | 2009-10-10 01:32:21 +0000 | [diff] [blame] | 749 | } |
| 750 | Emitter.EmitNode(SU->getNode(), SU->OrigNode != SU, SU->isCloned, |
Dan Gohman | af1d8ca | 2010-05-01 00:01:06 +0000 | [diff] [blame] | 751 | VRBaseMap); |
Dale Johannesen | fdb42fa | 2010-04-26 20:06:49 +0000 | [diff] [blame] | 752 | // Remember the source order of the inserted instruction. |
Evan Cheng | bfcb305 | 2010-03-25 01:38:16 +0000 | [diff] [blame] | 753 | if (HasDbg) |
Dan Gohman | 891ff8f | 2010-04-30 19:35:33 +0000 | [diff] [blame] | 754 | ProcessSourceNode(SU->getNode(), DAG, Emitter, VRBaseMap, Orders, |
Evan Cheng | bfcb305 | 2010-03-25 01:38:16 +0000 | [diff] [blame] | 755 | Seen); |
| 756 | } |
| 757 | |
Dale Johannesen | fdb42fa | 2010-04-26 20:06:49 +0000 | [diff] [blame] | 758 | // Insert all the dbg_values which have not already been inserted in source |
Evan Cheng | bfcb305 | 2010-03-25 01:38:16 +0000 | [diff] [blame] | 759 | // order sequence. |
| 760 | if (HasDbg) { |
Dan Gohman | 84023e0 | 2010-07-10 09:00:22 +0000 | [diff] [blame] | 761 | MachineBasicBlock::iterator BBBegin = BB->getFirstNonPHI(); |
Evan Cheng | bfcb305 | 2010-03-25 01:38:16 +0000 | [diff] [blame] | 762 | |
| 763 | // Sort the source order instructions and use the order to insert debug |
| 764 | // values. |
| 765 | std::sort(Orders.begin(), Orders.end(), OrderSorter()); |
| 766 | |
| 767 | SDDbgInfo::DbgIterator DI = DAG->DbgBegin(); |
| 768 | SDDbgInfo::DbgIterator DE = DAG->DbgEnd(); |
| 769 | // Now emit the rest according to source order. |
| 770 | unsigned LastOrder = 0; |
Evan Cheng | bfcb305 | 2010-03-25 01:38:16 +0000 | [diff] [blame] | 771 | for (unsigned i = 0, e = Orders.size(); i != e && DI != DE; ++i) { |
| 772 | unsigned Order = Orders[i].first; |
| 773 | MachineInstr *MI = Orders[i].second; |
| 774 | // Insert all SDDbgValue's whose order(s) are before "Order". |
| 775 | if (!MI) |
| 776 | continue; |
Evan Cheng | bfcb305 | 2010-03-25 01:38:16 +0000 | [diff] [blame] | 777 | for (; DI != DE && |
| 778 | (*DI)->getOrder() >= LastOrder && (*DI)->getOrder() < Order; ++DI) { |
| 779 | if ((*DI)->isInvalidated()) |
| 780 | continue; |
Dan Gohman | 891ff8f | 2010-04-30 19:35:33 +0000 | [diff] [blame] | 781 | MachineInstr *DbgMI = Emitter.EmitDbgValue(*DI, VRBaseMap); |
Evan Cheng | 962021b | 2010-04-26 07:38:55 +0000 | [diff] [blame] | 782 | if (DbgMI) { |
| 783 | if (!LastOrder) |
| 784 | // Insert to start of the BB (after PHIs). |
| 785 | BB->insert(BBBegin, DbgMI); |
| 786 | else { |
Dan Gohman | a8dab36 | 2010-07-10 22:42:31 +0000 | [diff] [blame] | 787 | // Insert at the instruction, which may be in a different |
| 788 | // block, if the block was split by a custom inserter. |
Evan Cheng | 962021b | 2010-04-26 07:38:55 +0000 | [diff] [blame] | 789 | MachineBasicBlock::iterator Pos = MI; |
Dan Gohman | a8dab36 | 2010-07-10 22:42:31 +0000 | [diff] [blame] | 790 | MI->getParent()->insert(llvm::next(Pos), DbgMI); |
Evan Cheng | 962021b | 2010-04-26 07:38:55 +0000 | [diff] [blame] | 791 | } |
Evan Cheng | bfcb305 | 2010-03-25 01:38:16 +0000 | [diff] [blame] | 792 | } |
Dale Johannesen | bfdf7f3 | 2010-03-10 22:13:47 +0000 | [diff] [blame] | 793 | } |
Evan Cheng | bfcb305 | 2010-03-25 01:38:16 +0000 | [diff] [blame] | 794 | LastOrder = Order; |
Evan Cheng | bfcb305 | 2010-03-25 01:38:16 +0000 | [diff] [blame] | 795 | } |
| 796 | // Add trailing DbgValue's before the terminator. FIXME: May want to add |
| 797 | // some of them before one or more conditional branches? |
| 798 | while (DI != DE) { |
| 799 | MachineBasicBlock *InsertBB = Emitter.getBlock(); |
| 800 | MachineBasicBlock::iterator Pos= Emitter.getBlock()->getFirstTerminator(); |
| 801 | if (!(*DI)->isInvalidated()) { |
Dan Gohman | 891ff8f | 2010-04-30 19:35:33 +0000 | [diff] [blame] | 802 | MachineInstr *DbgMI= Emitter.EmitDbgValue(*DI, VRBaseMap); |
Evan Cheng | 962021b | 2010-04-26 07:38:55 +0000 | [diff] [blame] | 803 | if (DbgMI) |
| 804 | InsertBB->insert(Pos, DbgMI); |
Evan Cheng | bfcb305 | 2010-03-25 01:38:16 +0000 | [diff] [blame] | 805 | } |
| 806 | ++DI; |
| 807 | } |
Dan Gohman | bcea859 | 2009-10-10 01:32:21 +0000 | [diff] [blame] | 808 | } |
| 809 | |
| 810 | BB = Emitter.getBlock(); |
| 811 | InsertPos = Emitter.getInsertPos(); |
| 812 | return BB; |
| 813 | } |