blob: 5b6f72fbb35caeae7a1e1a56b01683a77ae505ea [file] [log] [blame]
Eugene Zelenkofa912a72017-02-27 22:45:06 +00001//===- llvm/Target/TargetSchedule.cpp - Sched Machine Model ---------------===//
Andrew Trickd2a19da2012-09-14 20:26:46 +00002//
3// The LLVM Compiler Infrastructure
4//
5// This file is distributed under the University of Illinois Open Source
6// License. See LICENSE.TXT for details.
7//
8//===----------------------------------------------------------------------===//
9//
10// This file implements a wrapper around MCSchedModel that allows the interface
11// to benefit from information currently only available in TargetInstrInfo.
12//
13//===----------------------------------------------------------------------===//
14
Chandler Carruth6bda14b2017-06-06 11:49:48 +000015#include "llvm/CodeGen/TargetSchedule.h"
Eugene Zelenkofa912a72017-02-27 22:45:06 +000016#include "llvm/CodeGen/MachineFunction.h"
17#include "llvm/CodeGen/MachineInstr.h"
18#include "llvm/CodeGen/MachineOperand.h"
David Blaikie3f833ed2017-11-08 01:01:31 +000019#include "llvm/CodeGen/TargetInstrInfo.h"
David Blaikieb3bde2e2017-11-17 01:07:10 +000020#include "llvm/CodeGen/TargetRegisterInfo.h"
21#include "llvm/CodeGen/TargetSubtargetInfo.h"
Eugene Zelenkofa912a72017-02-27 22:45:06 +000022#include "llvm/MC/MCInstrDesc.h"
23#include "llvm/MC/MCInstrItineraries.h"
24#include "llvm/MC/MCSchedule.h"
Chandler Carruthed0881b2012-12-03 16:50:05 +000025#include "llvm/Support/CommandLine.h"
Eugene Zelenkofa912a72017-02-27 22:45:06 +000026#include "llvm/Support/ErrorHandling.h"
Chandler Carruthed0881b2012-12-03 16:50:05 +000027#include "llvm/Support/raw_ostream.h"
Eugene Zelenkofa912a72017-02-27 22:45:06 +000028#include <algorithm>
29#include <cassert>
30#include <cstdint>
Andrew Trickd2a19da2012-09-14 20:26:46 +000031
32using namespace llvm;
33
Andrew Trick8abcf4d2012-10-04 00:24:34 +000034static cl::opt<bool> EnableSchedModel("schedmodel", cl::Hidden, cl::init(true),
Andrew Trickd2a19da2012-09-14 20:26:46 +000035 cl::desc("Use TargetSchedModel for latency lookup"));
36
Andrew Trick6e6d5972012-09-18 04:03:34 +000037static cl::opt<bool> EnableSchedItins("scheditins", cl::Hidden, cl::init(true),
38 cl::desc("Use InstrItineraryData for latency lookup"));
39
Andrew Trickcfcf5202012-10-09 23:44:26 +000040bool TargetSchedModel::hasInstrSchedModel() const {
41 return EnableSchedModel && SchedModel.hasInstrSchedModel();
42}
43
44bool TargetSchedModel::hasInstrItineraries() const {
45 return EnableSchedItins && !InstrItins.isEmpty();
46}
47
Andrew Tricke96390e2012-11-06 07:10:38 +000048static unsigned gcd(unsigned Dividend, unsigned Divisor) {
49 // Dividend and Divisor will be naturally swapped as needed.
Eugene Zelenkofa912a72017-02-27 22:45:06 +000050 while (Divisor) {
Andrew Tricke96390e2012-11-06 07:10:38 +000051 unsigned Rem = Dividend % Divisor;
52 Dividend = Divisor;
53 Divisor = Rem;
54 };
55 return Dividend;
56}
Eugene Zelenkofa912a72017-02-27 22:45:06 +000057
Andrew Tricke96390e2012-11-06 07:10:38 +000058static unsigned lcm(unsigned A, unsigned B) {
59 unsigned LCM = (uint64_t(A) * B) / gcd(A, B);
60 assert((LCM >= A && LCM >= B) && "LCM overflow");
61 return LCM;
62}
63
Sanjay Patel0d7df362018-04-08 19:56:04 +000064void TargetSchedModel::init(const TargetSubtargetInfo *TSInfo) {
65 STI = TSInfo;
66 SchedModel = TSInfo->getSchedModel();
67 TII = TSInfo->getInstrInfo();
Andrew Trickd2a19da2012-09-14 20:26:46 +000068 STI->initInstrItins(InstrItins);
Andrew Tricke96390e2012-11-06 07:10:38 +000069
70 unsigned NumRes = SchedModel.getNumProcResourceKinds();
71 ResourceFactors.resize(NumRes);
72 ResourceLCM = SchedModel.IssueWidth;
73 for (unsigned Idx = 0; Idx < NumRes; ++Idx) {
74 unsigned NumUnits = SchedModel.getProcResource(Idx)->NumUnits;
75 if (NumUnits > 0)
76 ResourceLCM = lcm(ResourceLCM, NumUnits);
77 }
78 MicroOpFactor = ResourceLCM / SchedModel.IssueWidth;
79 for (unsigned Idx = 0; Idx < NumRes; ++Idx) {
80 unsigned NumUnits = SchedModel.getProcResource(Idx)->NumUnits;
81 ResourceFactors[Idx] = NumUnits ? (ResourceLCM / NumUnits) : 0;
82 }
Andrew Trickd2a19da2012-09-14 20:26:46 +000083}
Andrew Trick6e6d5972012-09-18 04:03:34 +000084
Javed Absar3d594372017-03-27 20:46:37 +000085/// Returns true only if instruction is specified as single issue.
86bool TargetSchedModel::mustBeginGroup(const MachineInstr *MI,
87 const MCSchedClassDesc *SC) const {
88 if (hasInstrSchedModel()) {
89 if (!SC)
90 SC = resolveSchedClass(MI);
91 if (SC->isValid())
92 return SC->BeginGroup;
93 }
94 return false;
95}
96
97bool TargetSchedModel::mustEndGroup(const MachineInstr *MI,
98 const MCSchedClassDesc *SC) const {
99 if (hasInstrSchedModel()) {
100 if (!SC)
101 SC = resolveSchedClass(MI);
102 if (SC->isValid())
103 return SC->EndGroup;
104 }
105 return false;
106}
107
Andrew Tricke96390e2012-11-06 07:10:38 +0000108unsigned TargetSchedModel::getNumMicroOps(const MachineInstr *MI,
109 const MCSchedClassDesc *SC) const {
Andrew Trickdd79f0f2012-10-10 05:43:09 +0000110 if (hasInstrItineraries()) {
111 int UOps = InstrItins.getNumMicroOps(MI->getDesc().getSchedClass());
Duncan P. N. Exon Smith9cfc75c2016-06-30 00:01:54 +0000112 return (UOps >= 0) ? UOps : TII->getNumMicroOps(&InstrItins, *MI);
Andrew Trickdd79f0f2012-10-10 05:43:09 +0000113 }
Andrew Trick5f35afb2012-10-11 05:37:06 +0000114 if (hasInstrSchedModel()) {
Andrew Tricke96390e2012-11-06 07:10:38 +0000115 if (!SC)
116 SC = resolveSchedClass(MI);
117 if (SC->isValid())
118 return SC->NumMicroOps;
Andrew Trick5f35afb2012-10-11 05:37:06 +0000119 }
120 return MI->isTransient() ? 0 : 1;
Andrew Trickdd79f0f2012-10-10 05:43:09 +0000121}
122
Andrew Trick0b1d8d02012-10-17 17:27:10 +0000123// The machine model may explicitly specify an invalid latency, which
124// effectively means infinite latency. Since users of the TargetSchedule API
125// don't know how to handle this, we convert it to a very large latency that is
126// easy to distinguish when debugging the DAG but won't induce overflow.
Andrew Trickde2109e2013-06-15 04:49:57 +0000127static unsigned capLatency(int Cycles) {
Andrew Trick0b1d8d02012-10-17 17:27:10 +0000128 return Cycles >= 0 ? Cycles : 1000;
129}
130
Andrew Trick6e6d5972012-09-18 04:03:34 +0000131/// Return the MCSchedClassDesc for this instruction. Some SchedClasses require
132/// evaluation of predicates that depend on instruction operands or flags.
133const MCSchedClassDesc *TargetSchedModel::
134resolveSchedClass(const MachineInstr *MI) const {
Andrew Trick6e6d5972012-09-18 04:03:34 +0000135 // Get the definition's scheduling class descriptor from this machine model.
136 unsigned SchedClass = MI->getDesc().getSchedClass();
137 const MCSchedClassDesc *SCDesc = SchedModel.getSchedClassDesc(SchedClass);
Andrew Trickbe2bccb2013-04-13 06:07:45 +0000138 if (!SCDesc->isValid())
139 return SCDesc;
Andrew Trick6e6d5972012-09-18 04:03:34 +0000140
141#ifndef NDEBUG
142 unsigned NIter = 0;
143#endif
144 while (SCDesc->isVariant()) {
145 assert(++NIter < 6 && "Variants are nested deeper than the magic number");
146
147 SchedClass = STI->resolveSchedClass(SchedClass, MI, this);
148 SCDesc = SchedModel.getSchedClassDesc(SchedClass);
149 }
150 return SCDesc;
151}
152
153/// Find the def index of this operand. This index maps to the machine model and
154/// is independent of use operands. Def operands may be reordered with uses or
155/// merged with uses without affecting the def index (e.g. before/after
156/// regalloc). However, an instruction's def operands must never be reordered
157/// with respect to each other.
158static unsigned findDefIdx(const MachineInstr *MI, unsigned DefOperIdx) {
159 unsigned DefIdx = 0;
160 for (unsigned i = 0; i != DefOperIdx; ++i) {
161 const MachineOperand &MO = MI->getOperand(i);
162 if (MO.isReg() && MO.isDef())
163 ++DefIdx;
164 }
165 return DefIdx;
166}
167
168/// Find the use index of this operand. This is independent of the instruction's
169/// def operands.
Andrew Trickf2b70d92012-09-18 18:20:02 +0000170///
171/// Note that uses are not determined by the operand's isUse property, which
172/// is simply the inverse of isDef. Here we consider any readsReg operand to be
173/// a "use". The machine model allows an operand to be both a Def and Use.
Andrew Trick6e6d5972012-09-18 04:03:34 +0000174static unsigned findUseIdx(const MachineInstr *MI, unsigned UseOperIdx) {
175 unsigned UseIdx = 0;
176 for (unsigned i = 0; i != UseOperIdx; ++i) {
177 const MachineOperand &MO = MI->getOperand(i);
Matthias Braun3a133152016-08-24 02:32:29 +0000178 if (MO.isReg() && MO.readsReg() && !MO.isDef())
Andrew Trick6e6d5972012-09-18 04:03:34 +0000179 ++UseIdx;
180 }
181 return UseIdx;
182}
183
184// Top-level API for clients that know the operand indices.
185unsigned TargetSchedModel::computeOperandLatency(
186 const MachineInstr *DefMI, unsigned DefOperIdx,
Andrew Trickde2109e2013-06-15 04:49:57 +0000187 const MachineInstr *UseMI, unsigned UseOperIdx) const {
Andrew Trick6e6d5972012-09-18 04:03:34 +0000188
Andrew Trickde2109e2013-06-15 04:49:57 +0000189 if (!hasInstrSchedModel() && !hasInstrItineraries())
Duncan P. N. Exon Smith9cfc75c2016-06-30 00:01:54 +0000190 return TII->defaultDefLatency(SchedModel, *DefMI);
Andrew Trick6e6d5972012-09-18 04:03:34 +0000191
Andrew Trickcfcf5202012-10-09 23:44:26 +0000192 if (hasInstrItineraries()) {
Andrew Trick8abcf4d2012-10-04 00:24:34 +0000193 int OperLatency = 0;
194 if (UseMI) {
Duncan P. N. Exon Smith9cfc75c2016-06-30 00:01:54 +0000195 OperLatency = TII->getOperandLatency(&InstrItins, *DefMI, DefOperIdx,
196 *UseMI, UseOperIdx);
Andrew Trick6e6d5972012-09-18 04:03:34 +0000197 }
Andrew Trick8abcf4d2012-10-04 00:24:34 +0000198 else {
199 unsigned DefClass = DefMI->getDesc().getSchedClass();
200 OperLatency = InstrItins.getOperandCycle(DefClass, DefOperIdx);
201 }
202 if (OperLatency >= 0)
203 return OperLatency;
204
205 // No operand latency was found.
Duncan P. N. Exon Smith9cfc75c2016-06-30 00:01:54 +0000206 unsigned InstrLatency = TII->getInstrLatency(&InstrItins, *DefMI);
Andrew Trick8abcf4d2012-10-04 00:24:34 +0000207
208 // Expected latency is the max of the stage latency and itinerary props.
Andrew Trick780fae82012-10-09 23:44:32 +0000209 // Rather than directly querying InstrItins stage latency, we call a TII
210 // hook to allow subtargets to specialize latency. This hook is only
211 // applicable to the InstrItins model. InstrSchedModel should model all
212 // special cases without TII hooks.
Duncan P. N. Exon Smith9cfc75c2016-06-30 00:01:54 +0000213 InstrLatency =
214 std::max(InstrLatency, TII->defaultDefLatency(SchedModel, *DefMI));
Andrew Trick8abcf4d2012-10-04 00:24:34 +0000215 return InstrLatency;
216 }
Andrew Trickde2109e2013-06-15 04:49:57 +0000217 // hasInstrSchedModel()
Andrew Trick8abcf4d2012-10-04 00:24:34 +0000218 const MCSchedClassDesc *SCDesc = resolveSchedClass(DefMI);
219 unsigned DefIdx = findDefIdx(DefMI, DefOperIdx);
220 if (DefIdx < SCDesc->NumWriteLatencyEntries) {
221 // Lookup the definition's write latency in SubtargetInfo.
222 const MCWriteLatencyEntry *WLEntry =
223 STI->getWriteLatencyEntry(SCDesc, DefIdx);
224 unsigned WriteID = WLEntry->WriteResourceID;
Andrew Trickde2109e2013-06-15 04:49:57 +0000225 unsigned Latency = capLatency(WLEntry->Cycles);
Andrew Trick8abcf4d2012-10-04 00:24:34 +0000226 if (!UseMI)
227 return Latency;
228
229 // Lookup the use's latency adjustment in SubtargetInfo.
230 const MCSchedClassDesc *UseDesc = resolveSchedClass(UseMI);
231 if (UseDesc->NumReadAdvanceEntries == 0)
232 return Latency;
233 unsigned UseIdx = findUseIdx(UseMI, UseOperIdx);
Andrew Trick5d4861862013-06-17 21:45:18 +0000234 int Advance = STI->getReadAdvanceCycles(UseDesc, UseIdx, WriteID);
235 if (Advance > 0 && (unsigned)Advance > Latency) // unsigned wrap
236 return 0;
237 return Latency - Advance;
Andrew Trick8abcf4d2012-10-04 00:24:34 +0000238 }
239 // If DefIdx does not exist in the model (e.g. implicit defs), then return
240 // unit latency (defaultDefLatency may be too conservative).
Andrew Trickf2b70d92012-09-18 18:20:02 +0000241#ifndef NDEBUG
Andrew Trick8abcf4d2012-10-04 00:24:34 +0000242 if (SCDesc->isValid() && !DefMI->getOperand(DefOperIdx).isImplicit()
Andrew Trickb6854d82013-09-25 18:14:12 +0000243 && !DefMI->getDesc().OpInfo[DefOperIdx].isOptionalDef()
244 && SchedModel.isComplete()) {
Matthias Braun244a6772015-07-17 17:50:11 +0000245 errs() << "DefIdx " << DefIdx << " exceeds machine model writes for "
MinSeong Kim4a9a4e12016-01-05 14:50:15 +0000246 << *DefMI << " (Try with MCSchedModel.CompleteModel set to false)";
Matthias Braun244a6772015-07-17 17:50:11 +0000247 llvm_unreachable("incomplete machine model");
Andrew Trick8abcf4d2012-10-04 00:24:34 +0000248 }
Andrew Trickf2b70d92012-09-18 18:20:02 +0000249#endif
Andrew Trick60570172013-03-16 18:58:57 +0000250 // FIXME: Automatically giving all implicit defs defaultDefLatency is
251 // undesirable. We should only do it for defs that are known to the MC
252 // desc like flags. Truly implicit defs should get 1 cycle latency.
Duncan P. N. Exon Smith9cfc75c2016-06-30 00:01:54 +0000253 return DefMI->isTransient() ? 0 : TII->defaultDefLatency(SchedModel, *DefMI);
Andrew Trick6e6d5972012-09-18 04:03:34 +0000254}
Andrew Trick780fae82012-10-09 23:44:32 +0000255
Matthias Braun42e1e662015-05-14 18:01:13 +0000256unsigned
257TargetSchedModel::computeInstrLatency(const MCSchedClassDesc &SCDesc) const {
Andrea Di Biagio30c1ba42018-03-13 15:22:13 +0000258 return capLatency(MCSchedModel::computeInstrLatency(*STI, SCDesc));
Matthias Braun42e1e662015-05-14 18:01:13 +0000259}
260
Gerolf Hoflehner5e1207e2014-08-03 21:35:39 +0000261unsigned TargetSchedModel::computeInstrLatency(unsigned Opcode) const {
262 assert(hasInstrSchedModel() && "Only call this function with a SchedModel");
Gerolf Hoflehner5e1207e2014-08-03 21:35:39 +0000263 unsigned SCIdx = TII->get(Opcode).getSchedClass();
Andrea Di Biagiob9acf132018-04-15 17:32:17 +0000264 return SchedModel.computeInstrLatency(*STI, SCIdx);
Gerolf Hoflehner5e1207e2014-08-03 21:35:39 +0000265}
266
Arnold Schwaighoferd2f96b92013-09-30 15:28:56 +0000267unsigned
268TargetSchedModel::computeInstrLatency(const MachineInstr *MI,
269 bool UseDefaultDefLatency) const {
Andrew Trickc334bd42012-10-10 05:43:18 +0000270 // For the itinerary model, fall back to the old subtarget hook.
271 // Allow subtargets to compute Bundle latencies outside the machine model.
Arnold Schwaighoferd2f96b92013-09-30 15:28:56 +0000272 if (hasInstrItineraries() || MI->isBundle() ||
273 (!hasInstrSchedModel() && !UseDefaultDefLatency))
Duncan P. N. Exon Smith9cfc75c2016-06-30 00:01:54 +0000274 return TII->getInstrLatency(&InstrItins, *MI);
Andrew Trickc334bd42012-10-10 05:43:18 +0000275
Andrew Trick780fae82012-10-09 23:44:32 +0000276 if (hasInstrSchedModel()) {
Andrew Trick780fae82012-10-09 23:44:32 +0000277 const MCSchedClassDesc *SCDesc = resolveSchedClass(MI);
Matthias Braun42e1e662015-05-14 18:01:13 +0000278 if (SCDesc->isValid())
279 return computeInstrLatency(*SCDesc);
Andrew Trick780fae82012-10-09 23:44:32 +0000280 }
Duncan P. N. Exon Smith9cfc75c2016-06-30 00:01:54 +0000281 return TII->defaultDefLatency(SchedModel, *MI);
Andrew Trick780fae82012-10-09 23:44:32 +0000282}
Andrew Trickdd79f0f2012-10-10 05:43:09 +0000283
284unsigned TargetSchedModel::
285computeOutputLatency(const MachineInstr *DefMI, unsigned DefOperIdx,
286 const MachineInstr *DepMI) const {
Junmo Park11811922016-06-21 08:09:58 +0000287 if (!SchedModel.isOutOfOrder())
Andrew Trickdd79f0f2012-10-10 05:43:09 +0000288 return 1;
289
Junmo Park11811922016-06-21 08:09:58 +0000290 // Out-of-order processor can dispatch WAW dependencies in the same cycle.
Andrew Trickdd79f0f2012-10-10 05:43:09 +0000291
292 // Treat predication as a data dependency for out-of-order cpus. In-order
293 // cpus do not need to treat predicated writes specially.
294 //
295 // TODO: The following hack exists because predication passes do not
296 // correctly append imp-use operands, and readsReg() strangely returns false
297 // for predicated defs.
298 unsigned Reg = DefMI->getOperand(DefOperIdx).getReg();
Justin Bognerfdf9bf42017-10-10 23:50:49 +0000299 const MachineFunction &MF = *DefMI->getMF();
Eric Christopherfc6de422014-08-05 02:39:49 +0000300 const TargetRegisterInfo *TRI = MF.getSubtarget().getRegisterInfo();
Duncan P. N. Exon Smith6307eb52016-02-23 02:46:52 +0000301 if (!DepMI->readsRegister(Reg, TRI) && TII->isPredicated(*DepMI))
Andrew Trickdd79f0f2012-10-10 05:43:09 +0000302 return computeInstrLatency(DefMI);
303
304 // If we have a per operand scheduling model, check if this def is writing
305 // an unbuffered resource. If so, it treated like an in-order cpu.
306 if (hasInstrSchedModel()) {
307 const MCSchedClassDesc *SCDesc = resolveSchedClass(DefMI);
Andrew Trick5f35afb2012-10-11 05:37:06 +0000308 if (SCDesc->isValid()) {
309 for (const MCWriteProcResEntry *PRI = STI->getWriteProcResBegin(SCDesc),
310 *PRE = STI->getWriteProcResEnd(SCDesc); PRI != PRE; ++PRI) {
Andrew Trickde2109e2013-06-15 04:49:57 +0000311 if (!SchedModel.getProcResource(PRI->ProcResourceIdx)->BufferSize)
Andrew Trick5f35afb2012-10-11 05:37:06 +0000312 return 1;
313 }
Andrew Trickdd79f0f2012-10-10 05:43:09 +0000314 }
315 }
316 return 0;
317}
Andrew V. Tischenko75745d02017-04-14 07:44:23 +0000318
Andrew V. Tischenko75745d02017-04-14 07:44:23 +0000319Optional<double>
Andrea Di Biagiob9acf132018-04-15 17:32:17 +0000320TargetSchedModel::computeReciprocalThroughput(const MachineInstr *MI) const {
321 if (hasInstrItineraries()) {
322 unsigned SchedClass = MI->getDesc().getSchedClass();
323 return MCSchedModel::getReciprocalThroughput(SchedClass,
324 *getInstrItineraries());
325 }
326
Andrew V. Tischenko75745d02017-04-14 07:44:23 +0000327 if (hasInstrSchedModel())
Andrea Di Biagio7faea7c2018-03-13 16:28:55 +0000328 return MCSchedModel::getReciprocalThroughput(*STI, *resolveSchedClass(MI));
Andrew V. Tischenko75745d02017-04-14 07:44:23 +0000329 return Optional<double>();
330}
331
332Optional<double>
Andrea Di Biagiob9acf132018-04-15 17:32:17 +0000333TargetSchedModel::computeReciprocalThroughput(unsigned Opcode) const {
Andrew V. Tischenko75745d02017-04-14 07:44:23 +0000334 unsigned SchedClass = TII->get(Opcode).getSchedClass();
335 if (hasInstrItineraries())
Andrea Di Biagiob9acf132018-04-15 17:32:17 +0000336 return MCSchedModel::getReciprocalThroughput(SchedClass,
337 *getInstrItineraries());
Andrew V. Tischenko75745d02017-04-14 07:44:23 +0000338 if (hasInstrSchedModel()) {
Andrea Di Biagio7faea7c2018-03-13 16:28:55 +0000339 const MCSchedClassDesc &SCDesc = *SchedModel.getSchedClassDesc(SchedClass);
340 if (SCDesc.isValid() && !SCDesc.isVariant())
341 return MCSchedModel::getReciprocalThroughput(*STI, SCDesc);
Andrew V. Tischenko75745d02017-04-14 07:44:23 +0000342 }
343 return Optional<double>();
344}