| Matt Arsenault | 382d945 | 2016-01-26 04:49:22 +0000 | [diff] [blame] | 1 | //===-- AMDGPU.td - AMDGPU Tablegen files --------*- tablegen -*-===// |
| Tom Stellard | 75aadc2 | 2012-12-11 21:25:42 +0000 | [diff] [blame] | 2 | // |
| 3 | // The LLVM Compiler Infrastructure |
| 4 | // |
| 5 | // This file is distributed under the University of Illinois Open Source |
| 6 | // License. See LICENSE.TXT for details. |
| 7 | // |
| Matt Arsenault | 382d945 | 2016-01-26 04:49:22 +0000 | [diff] [blame] | 8 | //===------------------------------------------------------------===// |
| Tom Stellard | 75aadc2 | 2012-12-11 21:25:42 +0000 | [diff] [blame] | 9 | |
| Tom Stellard | bc5b537 | 2014-06-13 16:38:59 +0000 | [diff] [blame] | 10 | include "llvm/Target/Target.td" |
| Tom Stellard | 75aadc2 | 2012-12-11 21:25:42 +0000 | [diff] [blame] | 11 | |
| Matt Arsenault | 382d945 | 2016-01-26 04:49:22 +0000 | [diff] [blame] | 12 | //===------------------------------------------------------------===// |
| 13 | // Subtarget Features (device properties) |
| 14 | //===------------------------------------------------------------===// |
| Tom Stellard | 783893a | 2013-11-18 19:43:33 +0000 | [diff] [blame] | 15 | |
| Matt Arsenault | f5e2997 | 2014-06-20 06:50:05 +0000 | [diff] [blame] | 16 | def FeatureFP64 : SubtargetFeature<"fp64", |
| Matt Arsenault | 382d945 | 2016-01-26 04:49:22 +0000 | [diff] [blame] | 17 | "FP64", |
| 18 | "true", |
| 19 | "Enable double precision operations" |
| 20 | >; |
| Matt Arsenault | f171cf2 | 2014-07-14 23:40:49 +0000 | [diff] [blame] | 21 | |
| Matt Arsenault | b035a57 | 2015-01-29 19:34:25 +0000 | [diff] [blame] | 22 | def FeatureFastFMAF32 : SubtargetFeature<"fast-fmaf", |
| Matt Arsenault | 382d945 | 2016-01-26 04:49:22 +0000 | [diff] [blame] | 23 | "FastFMAF32", |
| 24 | "true", |
| 25 | "Assuming f32 fma is at least as fast as mul + add" |
| 26 | >; |
| Matt Arsenault | b035a57 | 2015-01-29 19:34:25 +0000 | [diff] [blame] | 27 | |
| Matt Arsenault | e83690c | 2016-01-18 21:13:50 +0000 | [diff] [blame] | 28 | def HalfRate64Ops : SubtargetFeature<"half-rate-64-ops", |
| Matt Arsenault | 382d945 | 2016-01-26 04:49:22 +0000 | [diff] [blame] | 29 | "HalfRate64Ops", |
| 30 | "true", |
| 31 | "Most fp64 instructions are half rate instead of quarter" |
| 32 | >; |
| Matt Arsenault | f171cf2 | 2014-07-14 23:40:49 +0000 | [diff] [blame] | 33 | |
| Tom Stellard | 9979277 | 2013-06-07 20:28:49 +0000 | [diff] [blame] | 34 | def FeatureR600ALUInst : SubtargetFeature<"R600ALUInst", |
| Matt Arsenault | 382d945 | 2016-01-26 04:49:22 +0000 | [diff] [blame] | 35 | "R600ALUInst", |
| 36 | "false", |
| 37 | "Older version of ALU instructions encoding" |
| 38 | >; |
| Tom Stellard | 9979277 | 2013-06-07 20:28:49 +0000 | [diff] [blame] | 39 | |
| 40 | def FeatureVertexCache : SubtargetFeature<"HasVertexCache", |
| Matt Arsenault | 382d945 | 2016-01-26 04:49:22 +0000 | [diff] [blame] | 41 | "HasVertexCache", |
| 42 | "true", |
| 43 | "Specify use of dedicated vertex cache" |
| 44 | >; |
| Tom Stellard | 9979277 | 2013-06-07 20:28:49 +0000 | [diff] [blame] | 45 | |
| Tom Stellard | a6c6e1b | 2013-06-07 20:37:48 +0000 | [diff] [blame] | 46 | def FeatureCaymanISA : SubtargetFeature<"caymanISA", |
| Matt Arsenault | 382d945 | 2016-01-26 04:49:22 +0000 | [diff] [blame] | 47 | "CaymanISA", |
| 48 | "true", |
| 49 | "Use Cayman ISA" |
| 50 | >; |
| Tom Stellard | a6c6e1b | 2013-06-07 20:37:48 +0000 | [diff] [blame] | 51 | |
| Tom Stellard | 348273d | 2014-01-23 16:18:02 +0000 | [diff] [blame] | 52 | def FeatureCFALUBug : SubtargetFeature<"cfalubug", |
| Matt Arsenault | 382d945 | 2016-01-26 04:49:22 +0000 | [diff] [blame] | 53 | "CFALUBug", |
| 54 | "true", |
| 55 | "GPU has CF_ALU bug" |
| 56 | >; |
| Changpeng Fang | b41574a | 2015-12-22 20:55:23 +0000 | [diff] [blame] | 57 | |
| Matt Arsenault | 3f98140 | 2014-09-15 15:41:53 +0000 | [diff] [blame] | 58 | def FeatureFlatAddressSpace : SubtargetFeature<"flat-address-space", |
| Matt Arsenault | 382d945 | 2016-01-26 04:49:22 +0000 | [diff] [blame] | 59 | "FlatAddressSpace", |
| 60 | "true", |
| 61 | "Support flat address space" |
| 62 | >; |
| Matt Arsenault | 3f98140 | 2014-09-15 15:41:53 +0000 | [diff] [blame] | 63 | |
| Matt Arsenault | 7f681ac | 2016-07-01 23:03:44 +0000 | [diff] [blame] | 64 | def FeatureUnalignedBufferAccess : SubtargetFeature<"unaligned-buffer-access", |
| 65 | "UnalignedBufferAccess", |
| 66 | "true", |
| 67 | "Support unaligned global loads and stores" |
| 68 | >; |
| 69 | |
| Tom Stellard | 64a9d08 | 2016-10-14 18:10:39 +0000 | [diff] [blame^] | 70 | def FeatureUnalignedScratchAccess : SubtargetFeature<"unaligned-scratch-access", |
| 71 | "UnalignedScratchAccess", |
| 72 | "true", |
| 73 | "Support unaligned scratch loads and stores" |
| 74 | >; |
| 75 | |
| Nicolai Haehnle | 5b50497 | 2016-01-04 23:35:53 +0000 | [diff] [blame] | 76 | def FeatureXNACK : SubtargetFeature<"xnack", |
| Matt Arsenault | 382d945 | 2016-01-26 04:49:22 +0000 | [diff] [blame] | 77 | "EnableXNACK", |
| 78 | "true", |
| 79 | "Enable XNACK support" |
| 80 | >; |
| Tom Stellard | e99fb65 | 2015-01-20 19:33:04 +0000 | [diff] [blame] | 81 | |
| Marek Olsak | 4d00dd2 | 2015-03-09 15:48:09 +0000 | [diff] [blame] | 82 | def FeatureSGPRInitBug : SubtargetFeature<"sgpr-init-bug", |
| Matt Arsenault | 382d945 | 2016-01-26 04:49:22 +0000 | [diff] [blame] | 83 | "SGPRInitBug", |
| 84 | "true", |
| 85 | "VI SGPR initilization bug requiring a fixed SGPR allocation size" |
| 86 | >; |
| Tom Stellard | de008d3 | 2016-01-21 04:28:34 +0000 | [diff] [blame] | 87 | |
| Tom Stellard | 3498e4f | 2013-06-07 20:28:55 +0000 | [diff] [blame] | 88 | class SubtargetFeatureFetchLimit <string Value> : |
| 89 | SubtargetFeature <"fetch"#Value, |
| Matt Arsenault | 382d945 | 2016-01-26 04:49:22 +0000 | [diff] [blame] | 90 | "TexVTXClauseSize", |
| 91 | Value, |
| 92 | "Limit the maximum number of fetches in a clause to "#Value |
| 93 | >; |
| Tom Stellard | 9979277 | 2013-06-07 20:28:49 +0000 | [diff] [blame] | 94 | |
| Tom Stellard | 3498e4f | 2013-06-07 20:28:55 +0000 | [diff] [blame] | 95 | def FeatureFetchLimit8 : SubtargetFeatureFetchLimit <"8">; |
| 96 | def FeatureFetchLimit16 : SubtargetFeatureFetchLimit <"16">; |
| 97 | |
| Tom Stellard | 8c347b0 | 2014-01-22 21:55:40 +0000 | [diff] [blame] | 98 | class SubtargetFeatureWavefrontSize <int Value> : SubtargetFeature< |
| Matt Arsenault | 382d945 | 2016-01-26 04:49:22 +0000 | [diff] [blame] | 99 | "wavefrontsize"#Value, |
| 100 | "WavefrontSize", |
| 101 | !cast<string>(Value), |
| 102 | "The number of threads per wavefront" |
| 103 | >; |
| Tom Stellard | 8c347b0 | 2014-01-22 21:55:40 +0000 | [diff] [blame] | 104 | |
| 105 | def FeatureWavefrontSize16 : SubtargetFeatureWavefrontSize<16>; |
| 106 | def FeatureWavefrontSize32 : SubtargetFeatureWavefrontSize<32>; |
| 107 | def FeatureWavefrontSize64 : SubtargetFeatureWavefrontSize<64>; |
| 108 | |
| Tom Stellard | ec87f84 | 2015-05-25 16:15:54 +0000 | [diff] [blame] | 109 | class SubtargetFeatureLDSBankCount <int Value> : SubtargetFeature < |
| Matt Arsenault | 382d945 | 2016-01-26 04:49:22 +0000 | [diff] [blame] | 110 | "ldsbankcount"#Value, |
| 111 | "LDSBankCount", |
| 112 | !cast<string>(Value), |
| 113 | "The number of LDS banks per compute unit." |
| 114 | >; |
| Tom Stellard | ec87f84 | 2015-05-25 16:15:54 +0000 | [diff] [blame] | 115 | |
| 116 | def FeatureLDSBankCount16 : SubtargetFeatureLDSBankCount<16>; |
| 117 | def FeatureLDSBankCount32 : SubtargetFeatureLDSBankCount<32>; |
| 118 | |
| Tom Stellard | 347ac79 | 2015-06-26 21:15:07 +0000 | [diff] [blame] | 119 | class SubtargetFeatureISAVersion <int Major, int Minor, int Stepping> |
| 120 | : SubtargetFeature < |
| Matt Arsenault | 382d945 | 2016-01-26 04:49:22 +0000 | [diff] [blame] | 121 | "isaver"#Major#"."#Minor#"."#Stepping, |
| 122 | "IsaVersion", |
| 123 | "ISAVersion"#Major#"_"#Minor#"_"#Stepping, |
| 124 | "Instruction set version number" |
| Tom Stellard | 347ac79 | 2015-06-26 21:15:07 +0000 | [diff] [blame] | 125 | >; |
| 126 | |
| 127 | def FeatureISAVersion7_0_0 : SubtargetFeatureISAVersion <7,0,0>; |
| 128 | def FeatureISAVersion7_0_1 : SubtargetFeatureISAVersion <7,0,1>; |
| 129 | def FeatureISAVersion8_0_0 : SubtargetFeatureISAVersion <8,0,0>; |
| 130 | def FeatureISAVersion8_0_1 : SubtargetFeatureISAVersion <8,0,1>; |
| Changpeng Fang | 98317d2 | 2016-10-11 16:00:47 +0000 | [diff] [blame] | 131 | def FeatureISAVersion8_0_2 : SubtargetFeatureISAVersion <8,0,2>; |
| Changpeng Fang | c16be00 | 2016-01-13 20:39:25 +0000 | [diff] [blame] | 132 | def FeatureISAVersion8_0_3 : SubtargetFeatureISAVersion <8,0,3>; |
| Tom Stellard | 347ac79 | 2015-06-26 21:15:07 +0000 | [diff] [blame] | 133 | |
| Tom Stellard | 880a80a | 2014-06-17 16:53:14 +0000 | [diff] [blame] | 134 | class SubtargetFeatureLocalMemorySize <int Value> : SubtargetFeature< |
| Matt Arsenault | 382d945 | 2016-01-26 04:49:22 +0000 | [diff] [blame] | 135 | "localmemorysize"#Value, |
| 136 | "LocalMemorySize", |
| 137 | !cast<string>(Value), |
| 138 | "The size of local memory in bytes" |
| 139 | >; |
| Tom Stellard | 880a80a | 2014-06-17 16:53:14 +0000 | [diff] [blame] | 140 | |
| Tom Stellard | d7e6f13 | 2015-04-08 01:09:26 +0000 | [diff] [blame] | 141 | def FeatureGCN : SubtargetFeature<"gcn", |
| Matt Arsenault | 382d945 | 2016-01-26 04:49:22 +0000 | [diff] [blame] | 142 | "IsGCN", |
| 143 | "true", |
| 144 | "GCN or newer GPU" |
| 145 | >; |
| Tom Stellard | d7e6f13 | 2015-04-08 01:09:26 +0000 | [diff] [blame] | 146 | |
| 147 | def FeatureGCN1Encoding : SubtargetFeature<"gcn1-encoding", |
| Matt Arsenault | 382d945 | 2016-01-26 04:49:22 +0000 | [diff] [blame] | 148 | "GCN1Encoding", |
| 149 | "true", |
| 150 | "Encoding format for SI and CI" |
| 151 | >; |
| Tom Stellard | d7e6f13 | 2015-04-08 01:09:26 +0000 | [diff] [blame] | 152 | |
| 153 | def FeatureGCN3Encoding : SubtargetFeature<"gcn3-encoding", |
| Matt Arsenault | 382d945 | 2016-01-26 04:49:22 +0000 | [diff] [blame] | 154 | "GCN3Encoding", |
| 155 | "true", |
| 156 | "Encoding format for VI" |
| 157 | >; |
| Tom Stellard | d1f0f02 | 2015-04-23 19:33:54 +0000 | [diff] [blame] | 158 | |
| 159 | def FeatureCIInsts : SubtargetFeature<"ci-insts", |
| Matt Arsenault | 382d945 | 2016-01-26 04:49:22 +0000 | [diff] [blame] | 160 | "CIInsts", |
| 161 | "true", |
| 162 | "Additional intstructions for CI+" |
| 163 | >; |
| 164 | |
| Matt Arsenault | 9d82ee7 | 2016-02-27 08:53:55 +0000 | [diff] [blame] | 165 | def FeatureSMemRealTime : SubtargetFeature<"s-memrealtime", |
| 166 | "HasSMemRealTime", |
| Matt Arsenault | 61738cb | 2016-02-27 08:53:46 +0000 | [diff] [blame] | 167 | "true", |
| Matt Arsenault | 9d82ee7 | 2016-02-27 08:53:55 +0000 | [diff] [blame] | 168 | "Has s_memrealtime instruction" |
| 169 | >; |
| 170 | |
| 171 | def Feature16BitInsts : SubtargetFeature<"16-bit-insts", |
| 172 | "Has16BitInsts", |
| 173 | "true", |
| 174 | "Has i16/f16 instructions" |
| Matt Arsenault | 61738cb | 2016-02-27 08:53:46 +0000 | [diff] [blame] | 175 | >; |
| 176 | |
| Matt Arsenault | cc88ce3 | 2016-10-12 18:00:51 +0000 | [diff] [blame] | 177 | def FeatureMovrel : SubtargetFeature<"movrel", |
| 178 | "HasMovrel", |
| 179 | "true", |
| 180 | "Has v_movrel*_b32 instructions" |
| 181 | >; |
| 182 | |
| 183 | def FeatureVGPRIndexMode : SubtargetFeature<"vgpr-index-mode", |
| 184 | "HasVGPRIndexMode", |
| 185 | "true", |
| 186 | "Has VGPR mode register indexing" |
| 187 | >; |
| 188 | |
| Matt Arsenault | 382d945 | 2016-01-26 04:49:22 +0000 | [diff] [blame] | 189 | //===------------------------------------------------------------===// |
| 190 | // Subtarget Features (options and debugging) |
| 191 | //===------------------------------------------------------------===// |
| 192 | |
| 193 | // Some instructions do not support denormals despite this flag. Using |
| 194 | // fp32 denormals also causes instructions to run at the double |
| 195 | // precision rate for the device. |
| 196 | def FeatureFP32Denormals : SubtargetFeature<"fp32-denormals", |
| 197 | "FP32Denormals", |
| 198 | "true", |
| 199 | "Enable single precision denormal handling" |
| 200 | >; |
| 201 | |
| 202 | def FeatureFP64Denormals : SubtargetFeature<"fp64-denormals", |
| 203 | "FP64Denormals", |
| 204 | "true", |
| 205 | "Enable double precision denormal handling", |
| 206 | [FeatureFP64] |
| 207 | >; |
| 208 | |
| Matt Arsenault | f639c32 | 2016-01-28 20:53:42 +0000 | [diff] [blame] | 209 | def FeatureFPExceptions : SubtargetFeature<"fp-exceptions", |
| 210 | "FPExceptions", |
| 211 | "true", |
| 212 | "Enable floating point exceptions" |
| 213 | >; |
| 214 | |
| Matt Arsenault | 24ee078 | 2016-02-12 02:40:47 +0000 | [diff] [blame] | 215 | class FeatureMaxPrivateElementSize<int size> : SubtargetFeature< |
| 216 | "max-private-element-size-"#size, |
| 217 | "MaxPrivateElementSize", |
| 218 | !cast<string>(size), |
| 219 | "Maximum private access size may be "#size |
| 220 | >; |
| 221 | |
| 222 | def FeatureMaxPrivateElementSize4 : FeatureMaxPrivateElementSize<4>; |
| 223 | def FeatureMaxPrivateElementSize8 : FeatureMaxPrivateElementSize<8>; |
| 224 | def FeatureMaxPrivateElementSize16 : FeatureMaxPrivateElementSize<16>; |
| 225 | |
| Matt Arsenault | 382d945 | 2016-01-26 04:49:22 +0000 | [diff] [blame] | 226 | def FeatureVGPRSpilling : SubtargetFeature<"vgpr-spilling", |
| 227 | "EnableVGPRSpilling", |
| 228 | "true", |
| 229 | "Enable spilling of VGPRs to scratch memory" |
| 230 | >; |
| 231 | |
| 232 | def FeatureDumpCode : SubtargetFeature <"DumpCode", |
| 233 | "DumpCode", |
| 234 | "true", |
| 235 | "Dump MachineInstrs in the CodeEmitter" |
| 236 | >; |
| 237 | |
| 238 | def FeatureDumpCodeLower : SubtargetFeature <"dumpcode", |
| 239 | "DumpCode", |
| 240 | "true", |
| 241 | "Dump MachineInstrs in the CodeEmitter" |
| 242 | >; |
| 243 | |
| Matt Arsenault | 382d945 | 2016-01-26 04:49:22 +0000 | [diff] [blame] | 244 | def FeaturePromoteAlloca : SubtargetFeature <"promote-alloca", |
| 245 | "EnablePromoteAlloca", |
| 246 | "true", |
| 247 | "Enable promote alloca pass" |
| 248 | >; |
| 249 | |
| 250 | // XXX - This should probably be removed once enabled by default |
| 251 | def FeatureEnableLoadStoreOpt : SubtargetFeature <"load-store-opt", |
| 252 | "EnableLoadStoreOpt", |
| 253 | "true", |
| 254 | "Enable SI load/store optimizer pass" |
| 255 | >; |
| 256 | |
| 257 | // Performance debugging feature. Allow using DS instruction immediate |
| 258 | // offsets even if the base pointer can't be proven to be base. On SI, |
| 259 | // base pointer values that won't give the same result as a 16-bit add |
| 260 | // are not safe to fold, but this will override the conservative test |
| 261 | // for the base pointer. |
| 262 | def FeatureEnableUnsafeDSOffsetFolding : SubtargetFeature < |
| 263 | "unsafe-ds-offset-folding", |
| 264 | "EnableUnsafeDSOffsetFolding", |
| 265 | "true", |
| 266 | "Force using DS instruction immediate offsets on SI" |
| 267 | >; |
| 268 | |
| Matt Arsenault | 382d945 | 2016-01-26 04:49:22 +0000 | [diff] [blame] | 269 | def FeatureEnableSIScheduler : SubtargetFeature<"si-scheduler", |
| 270 | "EnableSIScheduler", |
| 271 | "true", |
| 272 | "Enable SI Machine Scheduler" |
| 273 | >; |
| 274 | |
| 275 | def FeatureFlatForGlobal : SubtargetFeature<"flat-for-global", |
| 276 | "FlatForGlobal", |
| 277 | "true", |
| 278 | "Force to generate flat instruction for global" |
| 279 | >; |
| Tom Stellard | d1f0f02 | 2015-04-23 19:33:54 +0000 | [diff] [blame] | 280 | |
| 281 | // Dummy feature used to disable assembler instructions. |
| 282 | def FeatureDisable : SubtargetFeature<"", |
| Matt Arsenault | 382d945 | 2016-01-26 04:49:22 +0000 | [diff] [blame] | 283 | "FeatureDisable","true", |
| 284 | "Dummy feature to disable assembler instructions" |
| 285 | >; |
| Tom Stellard | d1f0f02 | 2015-04-23 19:33:54 +0000 | [diff] [blame] | 286 | |
| Tom Stellard | a6c6e1b | 2013-06-07 20:37:48 +0000 | [diff] [blame] | 287 | class SubtargetFeatureGeneration <string Value, |
| 288 | list<SubtargetFeature> Implies> : |
| 289 | SubtargetFeature <Value, "Gen", "AMDGPUSubtarget::"#Value, |
| 290 | Value#" GPU generation", Implies>; |
| 291 | |
| Tom Stellard | 880a80a | 2014-06-17 16:53:14 +0000 | [diff] [blame] | 292 | def FeatureLocalMemorySize0 : SubtargetFeatureLocalMemorySize<0>; |
| 293 | def FeatureLocalMemorySize32768 : SubtargetFeatureLocalMemorySize<32768>; |
| 294 | def FeatureLocalMemorySize65536 : SubtargetFeatureLocalMemorySize<65536>; |
| 295 | |
| Tom Stellard | a6c6e1b | 2013-06-07 20:37:48 +0000 | [diff] [blame] | 296 | def FeatureR600 : SubtargetFeatureGeneration<"R600", |
| Matt Arsenault | 382d945 | 2016-01-26 04:49:22 +0000 | [diff] [blame] | 297 | [FeatureR600ALUInst, FeatureFetchLimit8, FeatureLocalMemorySize0] |
| 298 | >; |
| Tom Stellard | a6c6e1b | 2013-06-07 20:37:48 +0000 | [diff] [blame] | 299 | |
| 300 | def FeatureR700 : SubtargetFeatureGeneration<"R700", |
| Matt Arsenault | 382d945 | 2016-01-26 04:49:22 +0000 | [diff] [blame] | 301 | [FeatureFetchLimit16, FeatureLocalMemorySize0] |
| 302 | >; |
| Tom Stellard | a6c6e1b | 2013-06-07 20:37:48 +0000 | [diff] [blame] | 303 | |
| 304 | def FeatureEvergreen : SubtargetFeatureGeneration<"EVERGREEN", |
| Matt Arsenault | 382d945 | 2016-01-26 04:49:22 +0000 | [diff] [blame] | 305 | [FeatureFetchLimit16, FeatureLocalMemorySize32768] |
| 306 | >; |
| Tom Stellard | a6c6e1b | 2013-06-07 20:37:48 +0000 | [diff] [blame] | 307 | |
| 308 | def FeatureNorthernIslands : SubtargetFeatureGeneration<"NORTHERN_ISLANDS", |
| Matt Arsenault | 382d945 | 2016-01-26 04:49:22 +0000 | [diff] [blame] | 309 | [FeatureFetchLimit16, FeatureWavefrontSize64, |
| 310 | FeatureLocalMemorySize32768] |
| Tom Stellard | 880a80a | 2014-06-17 16:53:14 +0000 | [diff] [blame] | 311 | >; |
| Tom Stellard | a6c6e1b | 2013-06-07 20:37:48 +0000 | [diff] [blame] | 312 | |
| 313 | def FeatureSouthernIslands : SubtargetFeatureGeneration<"SOUTHERN_ISLANDS", |
| Matt Arsenault | 382d945 | 2016-01-26 04:49:22 +0000 | [diff] [blame] | 314 | [FeatureFP64, FeatureLocalMemorySize32768, |
| 315 | FeatureWavefrontSize64, FeatureGCN, FeatureGCN1Encoding, |
| Matt Arsenault | cc88ce3 | 2016-10-12 18:00:51 +0000 | [diff] [blame] | 316 | FeatureLDSBankCount32, FeatureMovrel] |
| Matt Arsenault | 382d945 | 2016-01-26 04:49:22 +0000 | [diff] [blame] | 317 | >; |
| Tom Stellard | a6c6e1b | 2013-06-07 20:37:48 +0000 | [diff] [blame] | 318 | |
| Tom Stellard | 6e1ee47 | 2013-10-29 16:37:28 +0000 | [diff] [blame] | 319 | def FeatureSeaIslands : SubtargetFeatureGeneration<"SEA_ISLANDS", |
| Matt Arsenault | 382d945 | 2016-01-26 04:49:22 +0000 | [diff] [blame] | 320 | [FeatureFP64, FeatureLocalMemorySize65536, |
| 321 | FeatureWavefrontSize64, FeatureGCN, FeatureFlatAddressSpace, |
| Matt Arsenault | cc88ce3 | 2016-10-12 18:00:51 +0000 | [diff] [blame] | 322 | FeatureGCN1Encoding, FeatureCIInsts, FeatureMovrel] |
| Matt Arsenault | 382d945 | 2016-01-26 04:49:22 +0000 | [diff] [blame] | 323 | >; |
| Marek Olsak | 5df00d6 | 2014-12-07 12:18:57 +0000 | [diff] [blame] | 324 | |
| 325 | def FeatureVolcanicIslands : SubtargetFeatureGeneration<"VOLCANIC_ISLANDS", |
| Matt Arsenault | 382d945 | 2016-01-26 04:49:22 +0000 | [diff] [blame] | 326 | [FeatureFP64, FeatureLocalMemorySize65536, |
| 327 | FeatureWavefrontSize64, FeatureFlatAddressSpace, FeatureGCN, |
| Matt Arsenault | 9d82ee7 | 2016-02-27 08:53:55 +0000 | [diff] [blame] | 328 | FeatureGCN3Encoding, FeatureCIInsts, Feature16BitInsts, |
| Matt Arsenault | cc88ce3 | 2016-10-12 18:00:51 +0000 | [diff] [blame] | 329 | FeatureSMemRealTime, FeatureVGPRIndexMode, FeatureMovrel |
| Matt Arsenault | 9d82ee7 | 2016-02-27 08:53:55 +0000 | [diff] [blame] | 330 | ] |
| Matt Arsenault | 382d945 | 2016-01-26 04:49:22 +0000 | [diff] [blame] | 331 | >; |
| Marek Olsak | 5df00d6 | 2014-12-07 12:18:57 +0000 | [diff] [blame] | 332 | |
| Tom Stellard | 3498e4f | 2013-06-07 20:28:55 +0000 | [diff] [blame] | 333 | //===----------------------------------------------------------------------===// |
| Konstantin Zhuravlyov | 8c273ad | 2016-04-18 16:28:23 +0000 | [diff] [blame] | 334 | // Debugger related subtarget features. |
| 335 | //===----------------------------------------------------------------------===// |
| 336 | |
| 337 | def FeatureDebuggerInsertNops : SubtargetFeature< |
| 338 | "amdgpu-debugger-insert-nops", |
| 339 | "DebuggerInsertNops", |
| 340 | "true", |
| Konstantin Zhuravlyov | e3d322a | 2016-05-13 18:21:28 +0000 | [diff] [blame] | 341 | "Insert one nop instruction for each high level source statement" |
| Konstantin Zhuravlyov | 8c273ad | 2016-04-18 16:28:23 +0000 | [diff] [blame] | 342 | >; |
| 343 | |
| Konstantin Zhuravlyov | 29ddd2b | 2016-05-24 18:37:18 +0000 | [diff] [blame] | 344 | def FeatureDebuggerReserveRegs : SubtargetFeature< |
| 345 | "amdgpu-debugger-reserve-regs", |
| 346 | "DebuggerReserveRegs", |
| Konstantin Zhuravlyov | 1d99c4d | 2016-04-26 15:43:14 +0000 | [diff] [blame] | 347 | "true", |
| Konstantin Zhuravlyov | 29ddd2b | 2016-05-24 18:37:18 +0000 | [diff] [blame] | 348 | "Reserve registers for debugger usage" |
| Konstantin Zhuravlyov | 1d99c4d | 2016-04-26 15:43:14 +0000 | [diff] [blame] | 349 | >; |
| 350 | |
| Konstantin Zhuravlyov | f2f3d14 | 2016-06-25 03:11:28 +0000 | [diff] [blame] | 351 | def FeatureDebuggerEmitPrologue : SubtargetFeature< |
| 352 | "amdgpu-debugger-emit-prologue", |
| 353 | "DebuggerEmitPrologue", |
| 354 | "true", |
| 355 | "Emit debugger prologue" |
| 356 | >; |
| 357 | |
| Konstantin Zhuravlyov | 8c273ad | 2016-04-18 16:28:23 +0000 | [diff] [blame] | 358 | //===----------------------------------------------------------------------===// |
| Tom Stellard | 75aadc2 | 2012-12-11 21:25:42 +0000 | [diff] [blame] | 359 | |
| 360 | def AMDGPUInstrInfo : InstrInfo { |
| 361 | let guessInstructionProperties = 1; |
| Matt Arsenault | 1ecac06 | 2015-02-18 02:15:32 +0000 | [diff] [blame] | 362 | let noNamedPositionallyEncodedOperands = 1; |
| Tom Stellard | 75aadc2 | 2012-12-11 21:25:42 +0000 | [diff] [blame] | 363 | } |
| 364 | |
| Tom Stellard | 9d7ddd5 | 2014-11-14 14:08:00 +0000 | [diff] [blame] | 365 | def AMDGPUAsmParser : AsmParser { |
| 366 | // Some of the R600 registers have the same name, so this crashes. |
| 367 | // For example T0_XYZW and T0_XY both have the asm name T0. |
| 368 | let ShouldEmitMatchRegisterName = 0; |
| 369 | } |
| 370 | |
| Konstantin Zhuravlyov | da4687c | 2016-09-27 14:42:48 +0000 | [diff] [blame] | 371 | def AMDGPUAsmWriter : AsmWriter { |
| 372 | int PassSubtarget = 1; |
| 373 | } |
| 374 | |
| Sam Kolton | d63d8a7 | 2016-09-09 09:37:51 +0000 | [diff] [blame] | 375 | def AMDGPUAsmVariants { |
| 376 | string Default = "Default"; |
| 377 | int Default_ID = 0; |
| 378 | string VOP3 = "VOP3"; |
| 379 | int VOP3_ID = 1; |
| 380 | string SDWA = "SDWA"; |
| 381 | int SDWA_ID = 2; |
| 382 | string DPP = "DPP"; |
| 383 | int DPP_ID = 3; |
| Sam Kolton | fb0d9d9 | 2016-09-12 14:42:43 +0000 | [diff] [blame] | 384 | string Disable = "Disable"; |
| 385 | int Disable_ID = 4; |
| Sam Kolton | d63d8a7 | 2016-09-09 09:37:51 +0000 | [diff] [blame] | 386 | } |
| 387 | |
| 388 | def DefaultAMDGPUAsmParserVariant : AsmParserVariant { |
| 389 | let Variant = AMDGPUAsmVariants.Default_ID; |
| 390 | let Name = AMDGPUAsmVariants.Default; |
| 391 | } |
| 392 | |
| 393 | def VOP3AsmParserVariant : AsmParserVariant { |
| 394 | let Variant = AMDGPUAsmVariants.VOP3_ID; |
| 395 | let Name = AMDGPUAsmVariants.VOP3; |
| 396 | } |
| 397 | |
| 398 | def SDWAAsmParserVariant : AsmParserVariant { |
| 399 | let Variant = AMDGPUAsmVariants.SDWA_ID; |
| 400 | let Name = AMDGPUAsmVariants.SDWA; |
| 401 | } |
| 402 | |
| 403 | def DPPAsmParserVariant : AsmParserVariant { |
| 404 | let Variant = AMDGPUAsmVariants.DPP_ID; |
| 405 | let Name = AMDGPUAsmVariants.DPP; |
| 406 | } |
| 407 | |
| Tom Stellard | 75aadc2 | 2012-12-11 21:25:42 +0000 | [diff] [blame] | 408 | def AMDGPU : Target { |
| 409 | // Pull in Instruction Info: |
| 410 | let InstructionSet = AMDGPUInstrInfo; |
| Tom Stellard | 9d7ddd5 | 2014-11-14 14:08:00 +0000 | [diff] [blame] | 411 | let AssemblyParsers = [AMDGPUAsmParser]; |
| Sam Kolton | d63d8a7 | 2016-09-09 09:37:51 +0000 | [diff] [blame] | 412 | let AssemblyParserVariants = [DefaultAMDGPUAsmParserVariant, |
| 413 | VOP3AsmParserVariant, |
| 414 | SDWAAsmParserVariant, |
| 415 | DPPAsmParserVariant]; |
| Konstantin Zhuravlyov | da4687c | 2016-09-27 14:42:48 +0000 | [diff] [blame] | 416 | let AssemblyWriters = [AMDGPUAsmWriter]; |
| Tom Stellard | 75aadc2 | 2012-12-11 21:25:42 +0000 | [diff] [blame] | 417 | } |
| 418 | |
| Tom Stellard | bc5b537 | 2014-06-13 16:38:59 +0000 | [diff] [blame] | 419 | // Dummy Instruction itineraries for pseudo instructions |
| 420 | def ALU_NULL : FuncUnit; |
| 421 | def NullALU : InstrItinClass; |
| 422 | |
| Tom Stellard | 0e70de5 | 2014-05-16 20:56:45 +0000 | [diff] [blame] | 423 | //===----------------------------------------------------------------------===// |
| 424 | // Predicate helper class |
| 425 | //===----------------------------------------------------------------------===// |
| 426 | |
| Tom Stellard | d1f0f02 | 2015-04-23 19:33:54 +0000 | [diff] [blame] | 427 | def TruePredicate : Predicate<"true">; |
| Matt Arsenault | 382d945 | 2016-01-26 04:49:22 +0000 | [diff] [blame] | 428 | |
| Tom Stellard | d1f0f02 | 2015-04-23 19:33:54 +0000 | [diff] [blame] | 429 | def isSICI : Predicate< |
| 430 | "Subtarget->getGeneration() == AMDGPUSubtarget::SOUTHERN_ISLANDS ||" |
| 431 | "Subtarget->getGeneration() == AMDGPUSubtarget::SEA_ISLANDS" |
| 432 | >, AssemblerPredicate<"FeatureGCN1Encoding">; |
| 433 | |
| Tom Stellard | 5ebdfbe | 2015-12-24 03:18:18 +0000 | [diff] [blame] | 434 | def isVI : Predicate < |
| 435 | "Subtarget->getGeneration() >= AMDGPUSubtarget::VOLCANIC_ISLANDS">, |
| 436 | AssemblerPredicate<"FeatureGCN3Encoding">; |
| 437 | |
| Matt Arsenault | 382d945 | 2016-01-26 04:49:22 +0000 | [diff] [blame] | 438 | def isCIVI : Predicate < |
| 439 | "Subtarget->getGeneration() == AMDGPUSubtarget::SEA_ISLANDS || " |
| 440 | "Subtarget->getGeneration() == AMDGPUSubtarget::VOLCANIC_ISLANDS" |
| 441 | >, AssemblerPredicate<"FeatureCIInsts">; |
| 442 | |
| 443 | def HasFlatAddressSpace : Predicate<"Subtarget->hasFlatAddressSpace()">; |
| 444 | |
| Tom Stellard | 0e70de5 | 2014-05-16 20:56:45 +0000 | [diff] [blame] | 445 | class PredicateControl { |
| 446 | Predicate SubtargetPredicate; |
| Tom Stellard | d1f0f02 | 2015-04-23 19:33:54 +0000 | [diff] [blame] | 447 | Predicate SIAssemblerPredicate = isSICI; |
| Tom Stellard | 5ebdfbe | 2015-12-24 03:18:18 +0000 | [diff] [blame] | 448 | Predicate VIAssemblerPredicate = isVI; |
| Tom Stellard | d7e6f13 | 2015-04-08 01:09:26 +0000 | [diff] [blame] | 449 | list<Predicate> AssemblerPredicates = []; |
| Tom Stellard | d1f0f02 | 2015-04-23 19:33:54 +0000 | [diff] [blame] | 450 | Predicate AssemblerPredicate = TruePredicate; |
| Tom Stellard | 0e70de5 | 2014-05-16 20:56:45 +0000 | [diff] [blame] | 451 | list<Predicate> OtherPredicates = []; |
| Tom Stellard | d1f0f02 | 2015-04-23 19:33:54 +0000 | [diff] [blame] | 452 | list<Predicate> Predicates = !listconcat([SubtargetPredicate, AssemblerPredicate], |
| Tom Stellard | d7e6f13 | 2015-04-08 01:09:26 +0000 | [diff] [blame] | 453 | AssemblerPredicates, |
| Tom Stellard | 0e70de5 | 2014-05-16 20:56:45 +0000 | [diff] [blame] | 454 | OtherPredicates); |
| 455 | } |
| 456 | |
| Tom Stellard | 75aadc2 | 2012-12-11 21:25:42 +0000 | [diff] [blame] | 457 | // Include AMDGPU TD files |
| 458 | include "R600Schedule.td" |
| 459 | include "SISchedule.td" |
| 460 | include "Processors.td" |
| 461 | include "AMDGPUInstrInfo.td" |
| 462 | include "AMDGPUIntrinsics.td" |
| 463 | include "AMDGPURegisterInfo.td" |
| 464 | include "AMDGPUInstructions.td" |
| Christian Konig | 2c8f6d5 | 2013-03-07 09:03:52 +0000 | [diff] [blame] | 465 | include "AMDGPUCallingConv.td" |