blob: 0f02f5825cb0d1729475592b3b980749572d5714 [file] [log] [blame]
Tom Stellard75aadc22012-12-11 21:25:42 +00001//===-- SISchedule.td - SI Scheduling definitons -------------------------===//
2//
3// The LLVM Compiler Infrastructure
4//
5// This file is distributed under the University of Illinois Open Source
6// License. See LICENSE.TXT for details.
7//
8//===----------------------------------------------------------------------===//
9//
Tom Stellardae38f302015-01-14 01:13:19 +000010// MachineModel definitions for Southern Islands (SI)
Tom Stellard75aadc22012-12-11 21:25:42 +000011//
12//===----------------------------------------------------------------------===//
13
Matthias Braun1e374a72016-06-24 23:52:11 +000014def : PredicateProlog<[{
15 const SIInstrInfo *TII =
16 static_cast<const SIInstrInfo*>(SchedModel->getInstrInfo());
17 (void)TII;
18}]>;
19
Tom Stellardae38f302015-01-14 01:13:19 +000020def WriteBranch : SchedWrite;
21def WriteExport : SchedWrite;
22def WriteLDS : SchedWrite;
23def WriteSALU : SchedWrite;
24def WriteSMEM : SchedWrite;
25def WriteVMEM : SchedWrite;
Matt Arsenault8ac35cd2015-09-08 19:54:32 +000026def WriteBarrier : SchedWrite;
Tom Stellard75aadc22012-12-11 21:25:42 +000027
Tom Stellardae38f302015-01-14 01:13:19 +000028// Vector ALU instructions
29def Write32Bit : SchedWrite;
30def WriteQuarterRate32 : SchedWrite;
Matt Arsenault5f704362015-09-25 16:58:25 +000031def WriteFullOrQuarterRate32 : SchedWrite;
Tom Stellardae38f302015-01-14 01:13:19 +000032
33def WriteFloatFMA : SchedWrite;
34
Matt Arsenault5f704362015-09-25 16:58:25 +000035// Slow quarter rate f64 instruction.
36def WriteDouble : SchedWrite;
37
38// half rate f64 instruction (same as v_add_f64)
Tom Stellardae38f302015-01-14 01:13:19 +000039def WriteDoubleAdd : SchedWrite;
40
Matt Arsenault5f704362015-09-25 16:58:25 +000041// Half rate 64-bit instructions.
42def Write64Bit : SchedWrite;
43
44// FIXME: Should there be a class for instructions which are VALU
45// instructions and have VALU rates, but write to the SALU (i.e. VOPC
46// instructions)
47
Tom Stellard1d5e6d42016-03-30 16:35:13 +000048class SISchedMachineModel : SchedMachineModel {
Matt Arsenaulta15ea4e2016-08-27 03:39:27 +000049 let CompleteModel = 1;
Tom Stellard0d23ebe2016-08-29 19:42:52 +000050 // MicroOpBufferSize = 1 means that instructions will always be added
51 // the ready queue when they become available. This exposes them
52 // to the register pressure analysis.
53 let MicroOpBufferSize = 1;
Tom Stellard1d5e6d42016-03-30 16:35:13 +000054 let IssueWidth = 1;
Tom Stellardcb6ba622016-04-30 00:23:06 +000055 let PostRAScheduler = 1;
Matt Arsenault9f5e0ef2017-01-25 04:25:02 +000056
57 // FIXME:Approximate 2 * branch cost. Try to hack around bad
58 // early-ifcvt heuristics. These need improvement to avoid the OOE
59 // heuristics.
60 int MispredictPenalty = 20;
Matthias Braun17cb5792016-03-01 20:03:21 +000061}
Tom Stellardae38f302015-01-14 01:13:19 +000062
Tom Stellard1d5e6d42016-03-30 16:35:13 +000063def SIFullSpeedModel : SISchedMachineModel;
64def SIQuarterSpeedModel : SISchedMachineModel;
Tom Stellardae38f302015-01-14 01:13:19 +000065
66// XXX: Are the resource counts correct?
Tom Stellard1d5e6d42016-03-30 16:35:13 +000067def HWBranch : ProcResource<1> {
68 let BufferSize = 1;
69}
70def HWExport : ProcResource<1> {
71 let BufferSize = 7; // Taken from S_WAITCNT
72}
73def HWLGKM : ProcResource<1> {
74 let BufferSize = 31; // Taken from S_WAITCNT
75}
76def HWSALU : ProcResource<1> {
77 let BufferSize = 1;
78}
79def HWVMEM : ProcResource<1> {
80 let BufferSize = 15; // Taken from S_WAITCNT
81}
82def HWVALU : ProcResource<1> {
83 let BufferSize = 1;
Tom Stellardae38f302015-01-14 01:13:19 +000084}
85
86class HWWriteRes<SchedWrite write, list<ProcResourceKind> resources,
87 int latency> : WriteRes<write, resources> {
88 let Latency = latency;
89}
90
91class HWVALUWriteRes<SchedWrite write, int latency> :
92 HWWriteRes<write, [HWVALU], latency>;
93
94
95// The latency numbers are taken from AMD Accelerated Parallel Processing
Matt Arsenault5f704362015-09-25 16:58:25 +000096// guide. They may not be accurate.
Tom Stellardae38f302015-01-14 01:13:19 +000097
98// The latency values are 1 / (operations / cycle) / 4.
99multiclass SICommonWriteRes {
100
Tom Stellard1d5e6d42016-03-30 16:35:13 +0000101 def : HWWriteRes<WriteBranch, [HWBranch], 8>;
102 def : HWWriteRes<WriteExport, [HWExport], 4>;
103 def : HWWriteRes<WriteLDS, [HWLGKM], 5>; // Can be between 2 and 64
104 def : HWWriteRes<WriteSALU, [HWSALU], 1>;
105 def : HWWriteRes<WriteSMEM, [HWLGKM], 5>;
106 def : HWWriteRes<WriteVMEM, [HWVMEM], 80>;
Matt Arsenault8ac35cd2015-09-08 19:54:32 +0000107 def : HWWriteRes<WriteBarrier, [HWBranch], 500>; // XXX: Guessed ???
Tom Stellardae38f302015-01-14 01:13:19 +0000108
109 def : HWVALUWriteRes<Write32Bit, 1>;
Matt Arsenault5f704362015-09-25 16:58:25 +0000110 def : HWVALUWriteRes<Write64Bit, 2>;
Tom Stellardae38f302015-01-14 01:13:19 +0000111 def : HWVALUWriteRes<WriteQuarterRate32, 4>;
112}
113
Matthias Braun1e374a72016-06-24 23:52:11 +0000114def PredIsVGPR32Copy : SchedPredicate<[{TII->isVGPRCopy(*MI) && TII->getOpSize(*MI, 0) <= 32}]>;
115def PredIsVGPR64Copy : SchedPredicate<[{TII->isVGPRCopy(*MI) && TII->getOpSize(*MI, 0) > 32}]>;
116def WriteCopy : SchedWriteVariant<[
117 SchedVar<PredIsVGPR32Copy, [Write32Bit]>,
118 SchedVar<PredIsVGPR64Copy, [Write64Bit]>,
119 SchedVar<NoSchedPred, [WriteSALU]>]>;
Tom Stellardae38f302015-01-14 01:13:19 +0000120
121let SchedModel = SIFullSpeedModel in {
122
123defm : SICommonWriteRes;
124
125def : HWVALUWriteRes<WriteFloatFMA, 1>;
126def : HWVALUWriteRes<WriteDouble, 4>;
127def : HWVALUWriteRes<WriteDoubleAdd, 2>;
128
Matthias Braun1e374a72016-06-24 23:52:11 +0000129def : InstRW<[WriteCopy], (instrs COPY)>;
130
Tom Stellardae38f302015-01-14 01:13:19 +0000131} // End SchedModel = SIFullSpeedModel
132
133let SchedModel = SIQuarterSpeedModel in {
134
135defm : SICommonWriteRes;
136
137def : HWVALUWriteRes<WriteFloatFMA, 16>;
138def : HWVALUWriteRes<WriteDouble, 16>;
139def : HWVALUWriteRes<WriteDoubleAdd, 8>;
140
Matthias Braun1e374a72016-06-24 23:52:11 +0000141def : InstRW<[WriteCopy], (instrs COPY)>;
142
Tom Stellardae38f302015-01-14 01:13:19 +0000143} // End SchedModel = SIQuarterSpeedModel