blob: da7601492f9ed5a762e292e9e92d1a79f731a279 [file] [log] [blame]
Tom Stellard75aadc22012-12-11 21:25:42 +00001//===-- SISchedule.td - SI Scheduling definitons -------------------------===//
2//
3// The LLVM Compiler Infrastructure
4//
5// This file is distributed under the University of Illinois Open Source
6// License. See LICENSE.TXT for details.
7//
8//===----------------------------------------------------------------------===//
9//
Tom Stellardae38f302015-01-14 01:13:19 +000010// MachineModel definitions for Southern Islands (SI)
Tom Stellard75aadc22012-12-11 21:25:42 +000011//
12//===----------------------------------------------------------------------===//
13
Tom Stellardae38f302015-01-14 01:13:19 +000014def WriteBranch : SchedWrite;
15def WriteExport : SchedWrite;
16def WriteLDS : SchedWrite;
17def WriteSALU : SchedWrite;
18def WriteSMEM : SchedWrite;
19def WriteVMEM : SchedWrite;
Matt Arsenault8ac35cd2015-09-08 19:54:32 +000020def WriteBarrier : SchedWrite;
Tom Stellard75aadc22012-12-11 21:25:42 +000021
Tom Stellardae38f302015-01-14 01:13:19 +000022// Vector ALU instructions
23def Write32Bit : SchedWrite;
24def WriteQuarterRate32 : SchedWrite;
25
26def WriteFloatFMA : SchedWrite;
27
28def WriteDouble : SchedWrite;
29def WriteDoubleAdd : SchedWrite;
30
31def SIFullSpeedModel : SchedMachineModel;
32def SIQuarterSpeedModel : SchedMachineModel;
33
34// BufferSize = 0 means the processors are in-order.
35let BufferSize = 0 in {
36
37// XXX: Are the resource counts correct?
38def HWBranch : ProcResource<1>;
39def HWExport : ProcResource<7>; // Taken from S_WAITCNT
40def HWLGKM : ProcResource<31>; // Taken from S_WAITCNT
41def HWSALU : ProcResource<1>;
42def HWVMEM : ProcResource<15>; // Taken from S_WAITCNT
43def HWVALU : ProcResource<1>;
44
45}
46
47class HWWriteRes<SchedWrite write, list<ProcResourceKind> resources,
48 int latency> : WriteRes<write, resources> {
49 let Latency = latency;
50}
51
52class HWVALUWriteRes<SchedWrite write, int latency> :
53 HWWriteRes<write, [HWVALU], latency>;
54
55
56// The latency numbers are taken from AMD Accelerated Parallel Processing
57// guide. They may not be acurate.
58
59// The latency values are 1 / (operations / cycle) / 4.
60multiclass SICommonWriteRes {
61
62 def : HWWriteRes<WriteBranch, [HWBranch], 100>; // XXX: Guessed ???
63 def : HWWriteRes<WriteExport, [HWExport], 100>; // XXX: Guessed ???
64 def : HWWriteRes<WriteLDS, [HWLGKM], 32>; // 2 - 64
65 def : HWWriteRes<WriteSALU, [HWSALU], 1>;
66 def : HWWriteRes<WriteSMEM, [HWLGKM], 10>; // XXX: Guessed ???
67 def : HWWriteRes<WriteVMEM, [HWVMEM], 450>; // 300 - 600
Matt Arsenault8ac35cd2015-09-08 19:54:32 +000068 def : HWWriteRes<WriteBarrier, [HWBranch], 500>; // XXX: Guessed ???
Tom Stellardae38f302015-01-14 01:13:19 +000069
70 def : HWVALUWriteRes<Write32Bit, 1>;
71 def : HWVALUWriteRes<WriteQuarterRate32, 4>;
72}
73
74
75let SchedModel = SIFullSpeedModel in {
76
77defm : SICommonWriteRes;
78
79def : HWVALUWriteRes<WriteFloatFMA, 1>;
80def : HWVALUWriteRes<WriteDouble, 4>;
81def : HWVALUWriteRes<WriteDoubleAdd, 2>;
82
83} // End SchedModel = SIFullSpeedModel
84
85let SchedModel = SIQuarterSpeedModel in {
86
87defm : SICommonWriteRes;
88
89def : HWVALUWriteRes<WriteFloatFMA, 16>;
90def : HWVALUWriteRes<WriteDouble, 16>;
91def : HWVALUWriteRes<WriteDoubleAdd, 8>;
92
93} // End SchedModel = SIQuarterSpeedModel