blob: 0db92fc254f39a4230cad1a7b493de1f7f7c8fb6 [file] [log] [blame]
Tom Stellard75aadc22012-12-11 21:25:42 +00001//===-- SISchedule.td - SI Scheduling definitons -------------------------===//
2//
3// The LLVM Compiler Infrastructure
4//
5// This file is distributed under the University of Illinois Open Source
6// License. See LICENSE.TXT for details.
7//
8//===----------------------------------------------------------------------===//
9//
Tom Stellardae38f302015-01-14 01:13:19 +000010// MachineModel definitions for Southern Islands (SI)
Tom Stellard75aadc22012-12-11 21:25:42 +000011//
12//===----------------------------------------------------------------------===//
13
Matthias Braun1e374a72016-06-24 23:52:11 +000014def : PredicateProlog<[{
15 const SIInstrInfo *TII =
16 static_cast<const SIInstrInfo*>(SchedModel->getInstrInfo());
17 (void)TII;
18}]>;
19
Tom Stellardae38f302015-01-14 01:13:19 +000020def WriteBranch : SchedWrite;
21def WriteExport : SchedWrite;
22def WriteLDS : SchedWrite;
23def WriteSALU : SchedWrite;
24def WriteSMEM : SchedWrite;
25def WriteVMEM : SchedWrite;
Matt Arsenault8ac35cd2015-09-08 19:54:32 +000026def WriteBarrier : SchedWrite;
Tom Stellard75aadc22012-12-11 21:25:42 +000027
Tom Stellardae38f302015-01-14 01:13:19 +000028// Vector ALU instructions
29def Write32Bit : SchedWrite;
30def WriteQuarterRate32 : SchedWrite;
Matt Arsenault5f704362015-09-25 16:58:25 +000031def WriteFullOrQuarterRate32 : SchedWrite;
Tom Stellardae38f302015-01-14 01:13:19 +000032
33def WriteFloatFMA : SchedWrite;
34
Matt Arsenault5f704362015-09-25 16:58:25 +000035// Slow quarter rate f64 instruction.
36def WriteDouble : SchedWrite;
37
38// half rate f64 instruction (same as v_add_f64)
Tom Stellardae38f302015-01-14 01:13:19 +000039def WriteDoubleAdd : SchedWrite;
40
Matt Arsenault5f704362015-09-25 16:58:25 +000041// Half rate 64-bit instructions.
42def Write64Bit : SchedWrite;
43
44// FIXME: Should there be a class for instructions which are VALU
45// instructions and have VALU rates, but write to the SALU (i.e. VOPC
46// instructions)
47
Tom Stellard1d5e6d42016-03-30 16:35:13 +000048class SISchedMachineModel : SchedMachineModel {
Matt Arsenaulta15ea4e2016-08-27 03:39:27 +000049 let CompleteModel = 1;
Tom Stellard1d5e6d42016-03-30 16:35:13 +000050 let IssueWidth = 1;
Tom Stellardcb6ba622016-04-30 00:23:06 +000051 let PostRAScheduler = 1;
Matthias Braun17cb5792016-03-01 20:03:21 +000052}
Tom Stellardae38f302015-01-14 01:13:19 +000053
Tom Stellard1d5e6d42016-03-30 16:35:13 +000054def SIFullSpeedModel : SISchedMachineModel;
55def SIQuarterSpeedModel : SISchedMachineModel;
Tom Stellardae38f302015-01-14 01:13:19 +000056
57// XXX: Are the resource counts correct?
Tom Stellard1d5e6d42016-03-30 16:35:13 +000058def HWBranch : ProcResource<1> {
59 let BufferSize = 1;
60}
61def HWExport : ProcResource<1> {
62 let BufferSize = 7; // Taken from S_WAITCNT
63}
64def HWLGKM : ProcResource<1> {
65 let BufferSize = 31; // Taken from S_WAITCNT
66}
67def HWSALU : ProcResource<1> {
68 let BufferSize = 1;
69}
70def HWVMEM : ProcResource<1> {
71 let BufferSize = 15; // Taken from S_WAITCNT
72}
73def HWVALU : ProcResource<1> {
74 let BufferSize = 1;
Tom Stellardae38f302015-01-14 01:13:19 +000075}
76
77class HWWriteRes<SchedWrite write, list<ProcResourceKind> resources,
78 int latency> : WriteRes<write, resources> {
79 let Latency = latency;
80}
81
82class HWVALUWriteRes<SchedWrite write, int latency> :
83 HWWriteRes<write, [HWVALU], latency>;
84
85
86// The latency numbers are taken from AMD Accelerated Parallel Processing
Matt Arsenault5f704362015-09-25 16:58:25 +000087// guide. They may not be accurate.
Tom Stellardae38f302015-01-14 01:13:19 +000088
89// The latency values are 1 / (operations / cycle) / 4.
90multiclass SICommonWriteRes {
91
Tom Stellard1d5e6d42016-03-30 16:35:13 +000092 def : HWWriteRes<WriteBranch, [HWBranch], 8>;
93 def : HWWriteRes<WriteExport, [HWExport], 4>;
94 def : HWWriteRes<WriteLDS, [HWLGKM], 5>; // Can be between 2 and 64
95 def : HWWriteRes<WriteSALU, [HWSALU], 1>;
96 def : HWWriteRes<WriteSMEM, [HWLGKM], 5>;
97 def : HWWriteRes<WriteVMEM, [HWVMEM], 80>;
Matt Arsenault8ac35cd2015-09-08 19:54:32 +000098 def : HWWriteRes<WriteBarrier, [HWBranch], 500>; // XXX: Guessed ???
Tom Stellardae38f302015-01-14 01:13:19 +000099
100 def : HWVALUWriteRes<Write32Bit, 1>;
Matt Arsenault5f704362015-09-25 16:58:25 +0000101 def : HWVALUWriteRes<Write64Bit, 2>;
Tom Stellardae38f302015-01-14 01:13:19 +0000102 def : HWVALUWriteRes<WriteQuarterRate32, 4>;
103}
104
Matthias Braun1e374a72016-06-24 23:52:11 +0000105def PredIsVGPR32Copy : SchedPredicate<[{TII->isVGPRCopy(*MI) && TII->getOpSize(*MI, 0) <= 32}]>;
106def PredIsVGPR64Copy : SchedPredicate<[{TII->isVGPRCopy(*MI) && TII->getOpSize(*MI, 0) > 32}]>;
107def WriteCopy : SchedWriteVariant<[
108 SchedVar<PredIsVGPR32Copy, [Write32Bit]>,
109 SchedVar<PredIsVGPR64Copy, [Write64Bit]>,
110 SchedVar<NoSchedPred, [WriteSALU]>]>;
Tom Stellardae38f302015-01-14 01:13:19 +0000111
112let SchedModel = SIFullSpeedModel in {
113
114defm : SICommonWriteRes;
115
116def : HWVALUWriteRes<WriteFloatFMA, 1>;
117def : HWVALUWriteRes<WriteDouble, 4>;
118def : HWVALUWriteRes<WriteDoubleAdd, 2>;
119
Matthias Braun1e374a72016-06-24 23:52:11 +0000120def : InstRW<[WriteCopy], (instrs COPY)>;
121
Tom Stellardae38f302015-01-14 01:13:19 +0000122} // End SchedModel = SIFullSpeedModel
123
124let SchedModel = SIQuarterSpeedModel in {
125
126defm : SICommonWriteRes;
127
128def : HWVALUWriteRes<WriteFloatFMA, 16>;
129def : HWVALUWriteRes<WriteDouble, 16>;
130def : HWVALUWriteRes<WriteDoubleAdd, 8>;
131
Matthias Braun1e374a72016-06-24 23:52:11 +0000132def : InstRW<[WriteCopy], (instrs COPY)>;
133
Tom Stellardae38f302015-01-14 01:13:19 +0000134} // End SchedModel = SIQuarterSpeedModel