blob: 6e1146e3a9d5357be5781542c6f32aba695ad4b4 [file] [log] [blame]
Andrea Di Biagio3a6b0922018-03-08 13:05:02 +00001//===--------------------- InstrBuilder.cpp ---------------------*- C++ -*-===//
2//
3// The LLVM Compiler Infrastructure
4//
5// This file is distributed under the University of Illinois Open Source
6// License. See LICENSE.TXT for details.
7//
8//===----------------------------------------------------------------------===//
9/// \file
10///
11/// This file implements the InstrBuilder interface.
12///
13//===----------------------------------------------------------------------===//
14
15#include "InstrBuilder.h"
Andrea Di Biagio2145b132018-06-20 10:08:11 +000016#include "llvm/ADT/APInt.h"
Andrea Di Biagio2008c7c2018-06-04 12:23:07 +000017#include "llvm/ADT/DenseMap.h"
Andrea Di Biagio3a6b0922018-03-08 13:05:02 +000018#include "llvm/MC/MCInst.h"
19#include "llvm/Support/Debug.h"
Andrea Di Biagio24fb4fc2018-05-04 13:52:12 +000020#include "llvm/Support/WithColor.h"
Andrea Di Biagio88347792018-07-09 12:30:55 +000021#include "llvm/Support/raw_ostream.h"
Andrea Di Biagio3a6b0922018-03-08 13:05:02 +000022
23#define DEBUG_TYPE "llvm-mca"
24
25namespace mca {
26
27using namespace llvm;
28
Andrea Di Biagio94fafdf2018-03-24 16:05:36 +000029static void initializeUsedResources(InstrDesc &ID,
30 const MCSchedClassDesc &SCDesc,
31 const MCSubtargetInfo &STI,
32 ArrayRef<uint64_t> ProcResourceMasks) {
Andrea Di Biagio3a6b0922018-03-08 13:05:02 +000033 const MCSchedModel &SM = STI.getSchedModel();
34
35 // Populate resources consumed.
36 using ResourcePlusCycles = std::pair<uint64_t, ResourceUsage>;
37 std::vector<ResourcePlusCycles> Worklist;
Andrea Di Biagio2008c7c2018-06-04 12:23:07 +000038
39 // Track cycles contributed by resources that are in a "Super" relationship.
40 // This is required if we want to correctly match the behavior of method
41 // SubtargetEmitter::ExpandProcResource() in Tablegen. When computing the set
42 // of "consumed" processor resources and resource cycles, the logic in
43 // ExpandProcResource() doesn't update the number of resource cycles
44 // contributed by a "Super" resource to a group.
45 // We need to take this into account when we find that a processor resource is
46 // part of a group, and it is also used as the "Super" of other resources.
47 // This map stores the number of cycles contributed by sub-resources that are
48 // part of a "Super" resource. The key value is the "Super" resource mask ID.
49 DenseMap<uint64_t, unsigned> SuperResources;
50
Andrea Di Biagio3a6b0922018-03-08 13:05:02 +000051 for (unsigned I = 0, E = SCDesc.NumWriteProcResEntries; I < E; ++I) {
52 const MCWriteProcResEntry *PRE = STI.getWriteProcResBegin(&SCDesc) + I;
53 const MCProcResourceDesc &PR = *SM.getProcResource(PRE->ProcResourceIdx);
54 uint64_t Mask = ProcResourceMasks[PRE->ProcResourceIdx];
55 if (PR.BufferSize != -1)
56 ID.Buffers.push_back(Mask);
57 CycleSegment RCy(0, PRE->Cycles, false);
58 Worklist.emplace_back(ResourcePlusCycles(Mask, ResourceUsage(RCy)));
Andrea Di Biagio2008c7c2018-06-04 12:23:07 +000059 if (PR.SuperIdx) {
60 uint64_t Super = ProcResourceMasks[PR.SuperIdx];
61 SuperResources[Super] += PRE->Cycles;
62 }
Andrea Di Biagio3a6b0922018-03-08 13:05:02 +000063 }
64
65 // Sort elements by mask popcount, so that we prioritize resource units over
66 // resource groups, and smaller groups over larger groups.
Mandeep Singh Grang8db564e2018-04-01 21:24:53 +000067 llvm::sort(Worklist.begin(), Worklist.end(),
68 [](const ResourcePlusCycles &A, const ResourcePlusCycles &B) {
69 unsigned popcntA = countPopulation(A.first);
70 unsigned popcntB = countPopulation(B.first);
71 if (popcntA < popcntB)
72 return true;
73 if (popcntA > popcntB)
74 return false;
75 return A.first < B.first;
76 });
Andrea Di Biagio3a6b0922018-03-08 13:05:02 +000077
78 uint64_t UsedResourceUnits = 0;
79
80 // Remove cycles contributed by smaller resources.
81 for (unsigned I = 0, E = Worklist.size(); I < E; ++I) {
82 ResourcePlusCycles &A = Worklist[I];
83 if (!A.second.size()) {
84 A.second.NumUnits = 0;
85 A.second.setReserved();
86 ID.Resources.emplace_back(A);
87 continue;
88 }
89
90 ID.Resources.emplace_back(A);
91 uint64_t NormalizedMask = A.first;
92 if (countPopulation(A.first) == 1) {
93 UsedResourceUnits |= A.first;
94 } else {
95 // Remove the leading 1 from the resource group mask.
96 NormalizedMask ^= PowerOf2Floor(NormalizedMask);
97 }
98
99 for (unsigned J = I + 1; J < E; ++J) {
100 ResourcePlusCycles &B = Worklist[J];
101 if ((NormalizedMask & B.first) == NormalizedMask) {
Andrea Di Biagio2008c7c2018-06-04 12:23:07 +0000102 B.second.CS.Subtract(A.second.size() - SuperResources[A.first]);
Andrea Di Biagio3a6b0922018-03-08 13:05:02 +0000103 if (countPopulation(B.first) > 1)
104 B.second.NumUnits++;
105 }
106 }
107 }
108
109 // A SchedWrite may specify a number of cycles in which a resource group
110 // is reserved. For example (on target x86; cpu Haswell):
111 //
112 // SchedWriteRes<[HWPort0, HWPort1, HWPort01]> {
113 // let ResourceCycles = [2, 2, 3];
114 // }
115 //
116 // This means:
117 // Resource units HWPort0 and HWPort1 are both used for 2cy.
118 // Resource group HWPort01 is the union of HWPort0 and HWPort1.
119 // Since this write touches both HWPort0 and HWPort1 for 2cy, HWPort01
120 // will not be usable for 2 entire cycles from instruction issue.
121 //
122 // On top of those 2cy, SchedWriteRes explicitly specifies an extra latency
123 // of 3 cycles for HWPort01. This tool assumes that the 3cy latency is an
124 // extra delay on top of the 2 cycles latency.
125 // During those extra cycles, HWPort01 is not usable by other instructions.
126 for (ResourcePlusCycles &RPC : ID.Resources) {
127 if (countPopulation(RPC.first) > 1 && !RPC.second.isReserved()) {
128 // Remove the leading 1 from the resource group mask.
129 uint64_t Mask = RPC.first ^ PowerOf2Floor(RPC.first);
130 if ((Mask & UsedResourceUnits) == Mask)
131 RPC.second.setReserved();
132 }
133 }
134
Nicola Zaghend34e60c2018-05-14 12:53:11 +0000135 LLVM_DEBUG({
Andrea Di Biagio3a6b0922018-03-08 13:05:02 +0000136 for (const std::pair<uint64_t, ResourceUsage> &R : ID.Resources)
137 dbgs() << "\t\tMask=" << R.first << ", cy=" << R.second.size() << '\n';
138 for (const uint64_t R : ID.Buffers)
139 dbgs() << "\t\tBuffer Mask=" << R << '\n';
Andrea Di Biagio7b3d1622018-03-20 12:58:34 +0000140 });
Andrea Di Biagio3a6b0922018-03-08 13:05:02 +0000141}
142
143static void computeMaxLatency(InstrDesc &ID, const MCInstrDesc &MCDesc,
144 const MCSchedClassDesc &SCDesc,
145 const MCSubtargetInfo &STI) {
Andrea Di Biagio3a6b0922018-03-08 13:05:02 +0000146 if (MCDesc.isCall()) {
147 // We cannot estimate how long this call will take.
148 // Artificially set an arbitrarily high latency (100cy).
Andrea Di Biagioc95a1302018-03-13 15:59:59 +0000149 ID.MaxLatency = 100U;
150 return;
Andrea Di Biagio3a6b0922018-03-08 13:05:02 +0000151 }
152
Andrea Di Biagioc95a1302018-03-13 15:59:59 +0000153 int Latency = MCSchedModel::computeInstrLatency(STI, SCDesc);
154 // If latency is unknown, then conservatively assume a MaxLatency of 100cy.
155 ID.MaxLatency = Latency < 0 ? 100U : static_cast<unsigned>(Latency);
Andrea Di Biagio3a6b0922018-03-08 13:05:02 +0000156}
157
Matt Davis4bcf3692018-08-13 18:11:48 +0000158Error InstrBuilder::populateWrites(InstrDesc &ID, const MCInst &MCI,
159 unsigned SchedClassID) {
Andrea Di Biagio88347792018-07-09 12:30:55 +0000160 const MCInstrDesc &MCDesc = MCII.get(MCI.getOpcode());
161 const MCSchedModel &SM = STI.getSchedModel();
162 const MCSchedClassDesc &SCDesc = *SM.getSchedClassDesc(SchedClassID);
163
Andrea Di Biagioace775e2018-06-21 12:14:49 +0000164 // These are for now the (strong) assumptions made by this algorithm:
Andrea Di Biagio3a6b0922018-03-08 13:05:02 +0000165 // * The number of explicit and implicit register definitions in a MCInst
166 // matches the number of explicit and implicit definitions according to
167 // the opcode descriptor (MCInstrDesc).
168 // * Register definitions take precedence over register uses in the operands
169 // list.
170 // * If an opcode specifies an optional definition, then the optional
171 // definition is always the last operand in the sequence, and it can be
172 // set to zero (i.e. "no register").
173 //
174 // These assumptions work quite well for most out-of-order in-tree targets
175 // like x86. This is mainly because the vast majority of instructions is
176 // expanded to MCInst using a straightforward lowering logic that preserves
177 // the ordering of the operands.
Andrea Di Biagio3a6b0922018-03-08 13:05:02 +0000178 unsigned NumExplicitDefs = MCDesc.getNumDefs();
179 unsigned NumImplicitDefs = MCDesc.getNumImplicitDefs();
180 unsigned NumWriteLatencyEntries = SCDesc.NumWriteLatencyEntries;
181 unsigned TotalDefs = NumExplicitDefs + NumImplicitDefs;
182 if (MCDesc.hasOptionalDef())
183 TotalDefs++;
184 ID.Writes.resize(TotalDefs);
185 // Iterate over the operands list, and skip non-register operands.
186 // The first NumExplictDefs register operands are expected to be register
187 // definitions.
188 unsigned CurrentDef = 0;
189 unsigned i = 0;
190 for (; i < MCI.getNumOperands() && CurrentDef < NumExplicitDefs; ++i) {
191 const MCOperand &Op = MCI.getOperand(i);
192 if (!Op.isReg())
193 continue;
194
195 WriteDescriptor &Write = ID.Writes[CurrentDef];
196 Write.OpIndex = i;
197 if (CurrentDef < NumWriteLatencyEntries) {
198 const MCWriteLatencyEntry &WLE =
199 *STI.getWriteLatencyEntry(&SCDesc, CurrentDef);
200 // Conservatively default to MaxLatency.
Andrea Di Biagio88347792018-07-09 12:30:55 +0000201 Write.Latency =
202 WLE.Cycles < 0 ? ID.MaxLatency : static_cast<unsigned>(WLE.Cycles);
Andrea Di Biagio3a6b0922018-03-08 13:05:02 +0000203 Write.SClassOrWriteResourceID = WLE.WriteResourceID;
204 } else {
205 // Assign a default latency for this write.
206 Write.Latency = ID.MaxLatency;
207 Write.SClassOrWriteResourceID = 0;
208 }
Andrea Di Biagio3a6b0922018-03-08 13:05:02 +0000209 Write.IsOptionalDef = false;
Nicola Zaghend34e60c2018-05-14 12:53:11 +0000210 LLVM_DEBUG({
Andrea Di Biagio23fbe7c2018-07-13 14:55:47 +0000211 dbgs() << "\t\t[Def] OpIdx=" << Write.OpIndex
212 << ", Latency=" << Write.Latency
Andrea Di Biagio7b3d1622018-03-20 12:58:34 +0000213 << ", WriteResourceID=" << Write.SClassOrWriteResourceID << '\n';
214 });
Andrea Di Biagio3a6b0922018-03-08 13:05:02 +0000215 CurrentDef++;
216 }
217
Matt Davis4bcf3692018-08-13 18:11:48 +0000218 if (CurrentDef != NumExplicitDefs) {
219 return make_error<StringError>(
220 "error: Expected more register operand definitions.",
221 inconvertibleErrorCode());
222 }
Andrea Di Biagio3a6b0922018-03-08 13:05:02 +0000223
224 CurrentDef = 0;
225 for (CurrentDef = 0; CurrentDef < NumImplicitDefs; ++CurrentDef) {
226 unsigned Index = NumExplicitDefs + CurrentDef;
227 WriteDescriptor &Write = ID.Writes[Index];
Andrea Di Biagio21f0fdb2018-06-22 16:37:05 +0000228 Write.OpIndex = ~CurrentDef;
Andrea Di Biagio3a6b0922018-03-08 13:05:02 +0000229 Write.RegisterID = MCDesc.getImplicitDefs()[CurrentDef];
Andrea Di Biagio6fd62fe2018-04-02 13:46:49 +0000230 if (Index < NumWriteLatencyEntries) {
231 const MCWriteLatencyEntry &WLE =
232 *STI.getWriteLatencyEntry(&SCDesc, Index);
233 // Conservatively default to MaxLatency.
Andrea Di Biagio88347792018-07-09 12:30:55 +0000234 Write.Latency =
235 WLE.Cycles < 0 ? ID.MaxLatency : static_cast<unsigned>(WLE.Cycles);
Andrea Di Biagio6fd62fe2018-04-02 13:46:49 +0000236 Write.SClassOrWriteResourceID = WLE.WriteResourceID;
237 } else {
238 // Assign a default latency for this write.
239 Write.Latency = ID.MaxLatency;
240 Write.SClassOrWriteResourceID = 0;
241 }
242
Andrea Di Biagio3a6b0922018-03-08 13:05:02 +0000243 Write.IsOptionalDef = false;
244 assert(Write.RegisterID != 0 && "Expected a valid phys register!");
Andrea Di Biagio23fbe7c2018-07-13 14:55:47 +0000245 LLVM_DEBUG({
246 dbgs() << "\t\t[Def] OpIdx=" << Write.OpIndex
247 << ", PhysReg=" << MRI.getName(Write.RegisterID)
248 << ", Latency=" << Write.Latency
249 << ", WriteResourceID=" << Write.SClassOrWriteResourceID << '\n';
250 });
Andrea Di Biagio3a6b0922018-03-08 13:05:02 +0000251 }
252
253 if (MCDesc.hasOptionalDef()) {
254 // Always assume that the optional definition is the last operand of the
255 // MCInst sequence.
256 const MCOperand &Op = MCI.getOperand(MCI.getNumOperands() - 1);
257 if (i == MCI.getNumOperands() || !Op.isReg())
Matt Davis4bcf3692018-08-13 18:11:48 +0000258 return make_error<StringError>(
Andrea Di Biagio3a6b0922018-03-08 13:05:02 +0000259 "error: expected a register operand for an optional "
Matt Davis4bcf3692018-08-13 18:11:48 +0000260 "definition. Instruction has not be correctly analyzed.",
261 inconvertibleErrorCode());
Andrea Di Biagio3a6b0922018-03-08 13:05:02 +0000262
263 WriteDescriptor &Write = ID.Writes[TotalDefs - 1];
264 Write.OpIndex = MCI.getNumOperands() - 1;
265 // Assign a default latency for this write.
266 Write.Latency = ID.MaxLatency;
267 Write.SClassOrWriteResourceID = 0;
268 Write.IsOptionalDef = true;
269 }
Matt Davis4bcf3692018-08-13 18:11:48 +0000270
271 return ErrorSuccess();
Andrea Di Biagio3a6b0922018-03-08 13:05:02 +0000272}
273
Matt Davis4bcf3692018-08-13 18:11:48 +0000274Error InstrBuilder::populateReads(InstrDesc &ID, const MCInst &MCI,
275 unsigned SchedClassID) {
Andrea Di Biagio88347792018-07-09 12:30:55 +0000276 const MCInstrDesc &MCDesc = MCII.get(MCI.getOpcode());
Andrea Di Biagio3a6b0922018-03-08 13:05:02 +0000277 unsigned NumExplicitDefs = MCDesc.getNumDefs();
Andrea Di Biagio88347792018-07-09 12:30:55 +0000278
Andrea Di Biagio3a6b0922018-03-08 13:05:02 +0000279 // Skip explicit definitions.
Andrea Di Biagio88347792018-07-09 12:30:55 +0000280 unsigned i = 0;
Andrea Di Biagio3a6b0922018-03-08 13:05:02 +0000281 for (; i < MCI.getNumOperands() && NumExplicitDefs; ++i) {
282 const MCOperand &Op = MCI.getOperand(i);
283 if (Op.isReg())
284 NumExplicitDefs--;
285 }
286
Matt Davis4bcf3692018-08-13 18:11:48 +0000287 if (NumExplicitDefs) {
288 return make_error<StringError>(
289 "error: Expected more register operand definitions. ",
290 inconvertibleErrorCode());
291 }
Andrea Di Biagio3a6b0922018-03-08 13:05:02 +0000292
293 unsigned NumExplicitUses = MCI.getNumOperands() - i;
294 unsigned NumImplicitUses = MCDesc.getNumImplicitUses();
295 if (MCDesc.hasOptionalDef()) {
296 assert(NumExplicitUses);
297 NumExplicitUses--;
298 }
299 unsigned TotalUses = NumExplicitUses + NumImplicitUses;
300 if (!TotalUses)
Matt Davis4bcf3692018-08-13 18:11:48 +0000301 return ErrorSuccess();
Andrea Di Biagio3a6b0922018-03-08 13:05:02 +0000302
303 ID.Reads.resize(TotalUses);
304 for (unsigned CurrentUse = 0; CurrentUse < NumExplicitUses; ++CurrentUse) {
305 ReadDescriptor &Read = ID.Reads[CurrentUse];
306 Read.OpIndex = i + CurrentUse;
Andrea Di Biagio0a837ef2018-03-29 14:26:56 +0000307 Read.UseIndex = CurrentUse;
Andrea Di Biagio3a6b0922018-03-08 13:05:02 +0000308 Read.SchedClassID = SchedClassID;
Andrea Di Biagio23fbe7c2018-07-13 14:55:47 +0000309 LLVM_DEBUG(dbgs() << "\t\t[Use] OpIdx=" << Read.OpIndex
310 << ", UseIndex=" << Read.UseIndex << '\n');
Andrea Di Biagio3a6b0922018-03-08 13:05:02 +0000311 }
312
313 for (unsigned CurrentUse = 0; CurrentUse < NumImplicitUses; ++CurrentUse) {
314 ReadDescriptor &Read = ID.Reads[NumExplicitUses + CurrentUse];
Andrea Di Biagio21f0fdb2018-06-22 16:37:05 +0000315 Read.OpIndex = ~CurrentUse;
Andrea Di Biagio6fd62fe2018-04-02 13:46:49 +0000316 Read.UseIndex = NumExplicitUses + CurrentUse;
Andrea Di Biagio3a6b0922018-03-08 13:05:02 +0000317 Read.RegisterID = MCDesc.getImplicitUses()[CurrentUse];
Andrea Di Biagio3a6b0922018-03-08 13:05:02 +0000318 Read.SchedClassID = SchedClassID;
Andrea Di Biagio23fbe7c2018-07-13 14:55:47 +0000319 LLVM_DEBUG(dbgs() << "\t\t[Use] OpIdx=" << Read.OpIndex << ", RegisterID="
320 << MRI.getName(Read.RegisterID) << '\n');
Andrea Di Biagio3a6b0922018-03-08 13:05:02 +0000321 }
Matt Davis4bcf3692018-08-13 18:11:48 +0000322 return ErrorSuccess();
Andrea Di Biagio3a6b0922018-03-08 13:05:02 +0000323}
324
Matt Davis4bcf3692018-08-13 18:11:48 +0000325Expected<const InstrDesc &>
326InstrBuilder::createInstrDescImpl(const MCInst &MCI) {
Andrea Di Biagio3a6b0922018-03-08 13:05:02 +0000327 assert(STI.getSchedModel().hasInstrSchedModel() &&
328 "Itineraries are not yet supported!");
329
Andrea Di Biagio3a6b0922018-03-08 13:05:02 +0000330 // Obtain the instruction descriptor from the opcode.
Andrea Di Biagio88347792018-07-09 12:30:55 +0000331 unsigned short Opcode = MCI.getOpcode();
Andrea Di Biagio3a6b0922018-03-08 13:05:02 +0000332 const MCInstrDesc &MCDesc = MCII.get(Opcode);
333 const MCSchedModel &SM = STI.getSchedModel();
334
335 // Then obtain the scheduling class information from the instruction.
Andrea Di Biagio49c85912018-05-04 13:10:10 +0000336 unsigned SchedClassID = MCDesc.getSchedClass();
Andrea Di Biagio39e5a562018-06-04 15:43:09 +0000337 unsigned CPUID = SM.getProcessorID();
338
339 // Try to solve variant scheduling classes.
340 if (SchedClassID) {
341 while (SchedClassID && SM.getSchedClassDesc(SchedClassID)->isVariant())
342 SchedClassID = STI.resolveVariantSchedClass(SchedClassID, &MCI, CPUID);
343
Matt Davis4bcf3692018-08-13 18:11:48 +0000344 if (!SchedClassID) {
345 return make_error<StringError>("unable to resolve this variant class.",
346 inconvertibleErrorCode());
347 }
Andrea Di Biagio39e5a562018-06-04 15:43:09 +0000348 }
Andrea Di Biagio3a6b0922018-03-08 13:05:02 +0000349
Matt Davis4bcf3692018-08-13 18:11:48 +0000350 // Check if this instruction is supported. Otherwise, report an error.
Andrea Di Biagio88347792018-07-09 12:30:55 +0000351 const MCSchedClassDesc &SCDesc = *SM.getSchedClassDesc(SchedClassID);
352 if (SCDesc.NumMicroOps == MCSchedClassDesc::InvalidNumMicroOps) {
353 std::string ToString;
354 llvm::raw_string_ostream OS(ToString);
355 WithColor::error() << "found an unsupported instruction in the input"
356 << " assembly sequence.\n";
357 MCIP.printInst(&MCI, OS, "", STI);
358 OS.flush();
Andrea Di Biagio88347792018-07-09 12:30:55 +0000359 WithColor::note() << "instruction: " << ToString << '\n';
Matt Davis4bcf3692018-08-13 18:11:48 +0000360 return make_error<StringError>(
361 "Don't know how to analyze unsupported instructions",
362 inconvertibleErrorCode());
Andrea Di Biagio88347792018-07-09 12:30:55 +0000363 }
364
Andrea Di Biagio3a6b0922018-03-08 13:05:02 +0000365 // Create a new empty descriptor.
Andrea Di Biagio7b3d1622018-03-20 12:58:34 +0000366 std::unique_ptr<InstrDesc> ID = llvm::make_unique<InstrDesc>();
Andrea Di Biagio39e5a562018-06-04 15:43:09 +0000367 ID->NumMicroOps = SCDesc.NumMicroOps;
Andrea Di Biagio3a6b0922018-03-08 13:05:02 +0000368
369 if (MCDesc.isCall()) {
370 // We don't correctly model calls.
Andrea Di Biagio24fb4fc2018-05-04 13:52:12 +0000371 WithColor::warning() << "found a call in the input assembly sequence.\n";
372 WithColor::note() << "call instructions are not correctly modeled. "
373 << "Assume a latency of 100cy.\n";
Andrea Di Biagio3a6b0922018-03-08 13:05:02 +0000374 }
375
376 if (MCDesc.isReturn()) {
Andrea Di Biagio24fb4fc2018-05-04 13:52:12 +0000377 WithColor::warning() << "found a return instruction in the input"
378 << " assembly sequence.\n";
379 WithColor::note() << "program counter updates are ignored.\n";
Andrea Di Biagio3a6b0922018-03-08 13:05:02 +0000380 }
381
382 ID->MayLoad = MCDesc.mayLoad();
383 ID->MayStore = MCDesc.mayStore();
384 ID->HasSideEffects = MCDesc.hasUnmodeledSideEffects();
385
386 initializeUsedResources(*ID, SCDesc, STI, ProcResourceMasks);
Andrea Di Biagiodb66efc2018-04-25 09:38:58 +0000387 computeMaxLatency(*ID, MCDesc, SCDesc, STI);
Matt Davis4bcf3692018-08-13 18:11:48 +0000388 if (auto Err = populateWrites(*ID, MCI, SchedClassID))
389 return std::move(Err);
390 if (auto Err = populateReads(*ID, MCI, SchedClassID))
391 return std::move(Err);
Andrea Di Biagio3a6b0922018-03-08 13:05:02 +0000392
Nicola Zaghend34e60c2018-05-14 12:53:11 +0000393 LLVM_DEBUG(dbgs() << "\t\tMaxLatency=" << ID->MaxLatency << '\n');
394 LLVM_DEBUG(dbgs() << "\t\tNumMicroOps=" << ID->NumMicroOps << '\n');
Andrea Di Biagio3a6b0922018-03-08 13:05:02 +0000395
396 // Now add the new descriptor.
Andrea Di Biagio39e5a562018-06-04 15:43:09 +0000397 SchedClassID = MCDesc.getSchedClass();
398 if (!SM.getSchedClassDesc(SchedClassID)->isVariant()) {
399 Descriptors[MCI.getOpcode()] = std::move(ID);
400 return *Descriptors[MCI.getOpcode()];
401 }
402
403 VariantDescriptors[&MCI] = std::move(ID);
404 return *VariantDescriptors[&MCI];
Andrea Di Biagio3a6b0922018-03-08 13:05:02 +0000405}
406
Matt Davis4bcf3692018-08-13 18:11:48 +0000407Expected<const InstrDesc &>
408InstrBuilder::getOrCreateInstrDesc(const MCInst &MCI) {
Andrea Di Biagio39e5a562018-06-04 15:43:09 +0000409 if (Descriptors.find_as(MCI.getOpcode()) != Descriptors.end())
410 return *Descriptors[MCI.getOpcode()];
411
412 if (VariantDescriptors.find(&MCI) != VariantDescriptors.end())
413 return *VariantDescriptors[&MCI];
414
415 return createInstrDescImpl(MCI);
Andrea Di Biagio3a6b0922018-03-08 13:05:02 +0000416}
417
Matt Davis4bcf3692018-08-13 18:11:48 +0000418Expected<std::unique_ptr<Instruction>>
Andrea Di Biagio49c85912018-05-04 13:10:10 +0000419InstrBuilder::createInstruction(const MCInst &MCI) {
Matt Davis4bcf3692018-08-13 18:11:48 +0000420 Expected<const InstrDesc &> DescOrErr = getOrCreateInstrDesc(MCI);
421 if (!DescOrErr)
422 return DescOrErr.takeError();
423 const InstrDesc &D = *DescOrErr;
Andrea Di Biagio7b3d1622018-03-20 12:58:34 +0000424 std::unique_ptr<Instruction> NewIS = llvm::make_unique<Instruction>(D);
Andrea Di Biagio3a6b0922018-03-08 13:05:02 +0000425
Andrea Di Biagio9f9cdd42018-09-18 15:00:06 +0000426 // Check if this is a dependency breaking instruction.
Andrea Di Biagio8b6c3142018-09-19 15:57:45 +0000427 APInt Mask;
428
429 unsigned ProcID = STI.getSchedModel().getProcessorID();
430 bool IsZeroIdiom = MCIA.isZeroIdiom(MCI, Mask, ProcID);
431 bool IsDepBreaking =
432 IsZeroIdiom || MCIA.isDependencyBreaking(MCI, Mask, ProcID);
Andrea Di Biagio9f9cdd42018-09-18 15:00:06 +0000433
Andrea Di Biagiodb66efc2018-04-25 09:38:58 +0000434 // Initialize Reads first.
Andrea Di Biagio3a6b0922018-03-08 13:05:02 +0000435 for (const ReadDescriptor &RD : D.Reads) {
436 int RegID = -1;
Andrea Di Biagio21f0fdb2018-06-22 16:37:05 +0000437 if (!RD.isImplicitRead()) {
Andrea Di Biagio3a6b0922018-03-08 13:05:02 +0000438 // explicit read.
439 const MCOperand &Op = MCI.getOperand(RD.OpIndex);
440 // Skip non-register operands.
441 if (!Op.isReg())
442 continue;
443 RegID = Op.getReg();
444 } else {
445 // Implicit read.
446 RegID = RD.RegisterID;
447 }
448
449 // Skip invalid register operands.
450 if (!RegID)
451 continue;
452
453 // Okay, this is a register operand. Create a ReadState for it.
454 assert(RegID > 0 && "Invalid register ID found!");
Andrea Di Biagio9f9cdd42018-09-18 15:00:06 +0000455 auto RS = llvm::make_unique<ReadState>(RD, RegID);
456
Andrea Di Biagio8b6c3142018-09-19 15:57:45 +0000457 if (IsDepBreaking) {
458 // A mask of all zeroes means: explicit input operands are not
459 // independent.
460 if (Mask.isNullValue()) {
461 if (!RD.isImplicitRead())
462 RS->setIndependentFromDef();
463 } else {
464 // Check if this register operand is independent according to `Mask`.
465 // Note that Mask may not have enough bits to describe all explicit and
466 // implicit input operands. If this register operand doesn't have a
467 // corresponding bit in Mask, then conservatively assume that it is
468 // dependent.
469 if (Mask.getBitWidth() > RD.UseIndex) {
470 // Okay. This map describe register use `RD.UseIndex`.
471 if (Mask[RD.UseIndex])
472 RS->setIndependentFromDef();
473 }
474 }
475 }
Andrea Di Biagio9f9cdd42018-09-18 15:00:06 +0000476 NewIS->getUses().emplace_back(std::move(RS));
Andrea Di Biagio4704f032018-03-20 12:25:54 +0000477 }
Andrea Di Biagio3a6b0922018-03-08 13:05:02 +0000478
Andrea Di Biagio2145b132018-06-20 10:08:11 +0000479 // Early exit if there are no writes.
480 if (D.Writes.empty())
Matt Davis4bcf3692018-08-13 18:11:48 +0000481 return std::move(NewIS);
Andrea Di Biagio2145b132018-06-20 10:08:11 +0000482
483 // Track register writes that implicitly clear the upper portion of the
484 // underlying super-registers using an APInt.
485 APInt WriteMask(D.Writes.size(), 0);
486
487 // Now query the MCInstrAnalysis object to obtain information about which
488 // register writes implicitly clear the upper portion of a super-register.
489 MCIA.clearsSuperRegisters(MRI, MCI, WriteMask);
490
Andrea Di Biagiodb66efc2018-04-25 09:38:58 +0000491 // Initialize writes.
Andrea Di Biagio2145b132018-06-20 10:08:11 +0000492 unsigned WriteIndex = 0;
Andrea Di Biagio3a6b0922018-03-08 13:05:02 +0000493 for (const WriteDescriptor &WD : D.Writes) {
Andrea Di Biagio88347792018-07-09 12:30:55 +0000494 unsigned RegID = WD.isImplicitWrite() ? WD.RegisterID
495 : MCI.getOperand(WD.OpIndex).getReg();
Andrea Di Biagio35622482018-03-22 10:19:20 +0000496 // Check if this is a optional definition that references NoReg.
Andrea Di Biagio2145b132018-06-20 10:08:11 +0000497 if (WD.IsOptionalDef && !RegID) {
498 ++WriteIndex;
Andrea Di Biagio3a6b0922018-03-08 13:05:02 +0000499 continue;
Andrea Di Biagio2145b132018-06-20 10:08:11 +0000500 }
Andrea Di Biagio3a6b0922018-03-08 13:05:02 +0000501
Andrea Di Biagio35622482018-03-22 10:19:20 +0000502 assert(RegID && "Expected a valid register ID!");
Andrea Di Biagiod65492a2018-06-20 14:30:17 +0000503 NewIS->getDefs().emplace_back(llvm::make_unique<WriteState>(
Andrea Di Biagio9f9cdd42018-09-18 15:00:06 +0000504 WD, RegID, /* ClearsSuperRegs */ WriteMask[WriteIndex],
505 /* WritesZero */ IsZeroIdiom));
Andrea Di Biagio2145b132018-06-20 10:08:11 +0000506 ++WriteIndex;
Andrea Di Biagio3a6b0922018-03-08 13:05:02 +0000507 }
508
Matt Davis4bcf3692018-08-13 18:11:48 +0000509 return std::move(NewIS);
Andrea Di Biagio3a6b0922018-03-08 13:05:02 +0000510}
Andrea Di Biagio3a6b0922018-03-08 13:05:02 +0000511} // namespace mca