| Matt Arsenault | 382d945 | 2016-01-26 04:49:22 +0000 | [diff] [blame] | 1 | //===-- AMDGPU.td - AMDGPU Tablegen files --------*- tablegen -*-===// |
| Tom Stellard | 75aadc2 | 2012-12-11 21:25:42 +0000 | [diff] [blame] | 2 | // |
| 3 | // The LLVM Compiler Infrastructure |
| 4 | // |
| 5 | // This file is distributed under the University of Illinois Open Source |
| 6 | // License. See LICENSE.TXT for details. |
| 7 | // |
| Matt Arsenault | 382d945 | 2016-01-26 04:49:22 +0000 | [diff] [blame] | 8 | //===------------------------------------------------------------===// |
| Tom Stellard | 75aadc2 | 2012-12-11 21:25:42 +0000 | [diff] [blame] | 9 | |
| Tom Stellard | bc5b537 | 2014-06-13 16:38:59 +0000 | [diff] [blame] | 10 | include "llvm/Target/Target.td" |
| Tom Stellard | 75aadc2 | 2012-12-11 21:25:42 +0000 | [diff] [blame] | 11 | |
| Matt Arsenault | 382d945 | 2016-01-26 04:49:22 +0000 | [diff] [blame] | 12 | //===------------------------------------------------------------===// |
| 13 | // Subtarget Features (device properties) |
| 14 | //===------------------------------------------------------------===// |
| Tom Stellard | 783893a | 2013-11-18 19:43:33 +0000 | [diff] [blame] | 15 | |
| Matt Arsenault | f5e2997 | 2014-06-20 06:50:05 +0000 | [diff] [blame] | 16 | def FeatureFP64 : SubtargetFeature<"fp64", |
| Matt Arsenault | 382d945 | 2016-01-26 04:49:22 +0000 | [diff] [blame] | 17 | "FP64", |
| 18 | "true", |
| 19 | "Enable double precision operations" |
| 20 | >; |
| Matt Arsenault | f171cf2 | 2014-07-14 23:40:49 +0000 | [diff] [blame] | 21 | |
| Matt Arsenault | b035a57 | 2015-01-29 19:34:25 +0000 | [diff] [blame] | 22 | def FeatureFastFMAF32 : SubtargetFeature<"fast-fmaf", |
| Matt Arsenault | 382d945 | 2016-01-26 04:49:22 +0000 | [diff] [blame] | 23 | "FastFMAF32", |
| 24 | "true", |
| 25 | "Assuming f32 fma is at least as fast as mul + add" |
| 26 | >; |
| Matt Arsenault | b035a57 | 2015-01-29 19:34:25 +0000 | [diff] [blame] | 27 | |
| Matt Arsenault | e83690c | 2016-01-18 21:13:50 +0000 | [diff] [blame] | 28 | def HalfRate64Ops : SubtargetFeature<"half-rate-64-ops", |
| Matt Arsenault | 382d945 | 2016-01-26 04:49:22 +0000 | [diff] [blame] | 29 | "HalfRate64Ops", |
| 30 | "true", |
| 31 | "Most fp64 instructions are half rate instead of quarter" |
| 32 | >; |
| Matt Arsenault | f171cf2 | 2014-07-14 23:40:49 +0000 | [diff] [blame] | 33 | |
| Tom Stellard | 9979277 | 2013-06-07 20:28:49 +0000 | [diff] [blame] | 34 | def FeatureR600ALUInst : SubtargetFeature<"R600ALUInst", |
| Matt Arsenault | 382d945 | 2016-01-26 04:49:22 +0000 | [diff] [blame] | 35 | "R600ALUInst", |
| 36 | "false", |
| 37 | "Older version of ALU instructions encoding" |
| 38 | >; |
| Tom Stellard | 9979277 | 2013-06-07 20:28:49 +0000 | [diff] [blame] | 39 | |
| 40 | def FeatureVertexCache : SubtargetFeature<"HasVertexCache", |
| Matt Arsenault | 382d945 | 2016-01-26 04:49:22 +0000 | [diff] [blame] | 41 | "HasVertexCache", |
| 42 | "true", |
| 43 | "Specify use of dedicated vertex cache" |
| 44 | >; |
| Tom Stellard | 9979277 | 2013-06-07 20:28:49 +0000 | [diff] [blame] | 45 | |
| Tom Stellard | a6c6e1b | 2013-06-07 20:37:48 +0000 | [diff] [blame] | 46 | def FeatureCaymanISA : SubtargetFeature<"caymanISA", |
| Matt Arsenault | 382d945 | 2016-01-26 04:49:22 +0000 | [diff] [blame] | 47 | "CaymanISA", |
| 48 | "true", |
| 49 | "Use Cayman ISA" |
| 50 | >; |
| Tom Stellard | a6c6e1b | 2013-06-07 20:37:48 +0000 | [diff] [blame] | 51 | |
| Tom Stellard | 348273d | 2014-01-23 16:18:02 +0000 | [diff] [blame] | 52 | def FeatureCFALUBug : SubtargetFeature<"cfalubug", |
| Matt Arsenault | 382d945 | 2016-01-26 04:49:22 +0000 | [diff] [blame] | 53 | "CFALUBug", |
| 54 | "true", |
| 55 | "GPU has CF_ALU bug" |
| 56 | >; |
| Changpeng Fang | b41574a | 2015-12-22 20:55:23 +0000 | [diff] [blame] | 57 | |
| Matt Arsenault | 3f98140 | 2014-09-15 15:41:53 +0000 | [diff] [blame] | 58 | def FeatureFlatAddressSpace : SubtargetFeature<"flat-address-space", |
| Matt Arsenault | 382d945 | 2016-01-26 04:49:22 +0000 | [diff] [blame] | 59 | "FlatAddressSpace", |
| 60 | "true", |
| 61 | "Support flat address space" |
| 62 | >; |
| Matt Arsenault | 3f98140 | 2014-09-15 15:41:53 +0000 | [diff] [blame] | 63 | |
| Matt Arsenault | acdc765 | 2017-05-10 21:19:05 +0000 | [diff] [blame] | 64 | def FeatureFlatInstOffsets : SubtargetFeature<"flat-inst-offsets", |
| 65 | "FlatInstOffsets", |
| 66 | "true", |
| 67 | "Flat instructions have immediate offset addressing mode" |
| 68 | >; |
| 69 | |
| 70 | def FeatureFlatGlobalInsts : SubtargetFeature<"flat-global-insts", |
| 71 | "FlatGlobalInsts", |
| 72 | "true", |
| 73 | "Have global_* flat memory instructions" |
| 74 | >; |
| 75 | |
| 76 | def FeatureFlatScratchInsts : SubtargetFeature<"flat-scratch-insts", |
| 77 | "FlatScratchInsts", |
| 78 | "true", |
| 79 | "Have scratch_* flat memory instructions" |
| 80 | >; |
| 81 | |
| Matt Arsenault | c37fe66 | 2017-07-20 17:42:47 +0000 | [diff] [blame] | 82 | def FeatureAddNoCarryInsts : SubtargetFeature<"add-no-carry-insts", |
| 83 | "AddNoCarryInsts", |
| 84 | "true", |
| 85 | "Have VALU add/sub instructions without carry out" |
| 86 | >; |
| 87 | |
| Matt Arsenault | 7f681ac | 2016-07-01 23:03:44 +0000 | [diff] [blame] | 88 | def FeatureUnalignedBufferAccess : SubtargetFeature<"unaligned-buffer-access", |
| 89 | "UnalignedBufferAccess", |
| 90 | "true", |
| 91 | "Support unaligned global loads and stores" |
| 92 | >; |
| 93 | |
| Wei Ding | 205bfdb | 2017-02-10 02:15:29 +0000 | [diff] [blame] | 94 | def FeatureTrapHandler: SubtargetFeature<"trap-handler", |
| 95 | "TrapHandler", |
| 96 | "true", |
| 97 | "Trap handler support" |
| 98 | >; |
| 99 | |
| Tom Stellard | 64a9d08 | 2016-10-14 18:10:39 +0000 | [diff] [blame] | 100 | def FeatureUnalignedScratchAccess : SubtargetFeature<"unaligned-scratch-access", |
| 101 | "UnalignedScratchAccess", |
| 102 | "true", |
| 103 | "Support unaligned scratch loads and stores" |
| 104 | >; |
| 105 | |
| Matt Arsenault | e823d92 | 2017-02-18 18:29:53 +0000 | [diff] [blame] | 106 | def FeatureApertureRegs : SubtargetFeature<"aperture-regs", |
| 107 | "HasApertureRegs", |
| 108 | "true", |
| 109 | "Has Memory Aperture Base and Size Registers" |
| 110 | >; |
| 111 | |
| Matt Arsenault | 28f52e5 | 2017-10-25 07:00:51 +0000 | [diff] [blame] | 112 | def FeatureMadMixInsts : SubtargetFeature<"mad-mix-insts", |
| 113 | "HasMadMixInsts", |
| 114 | "true", |
| 115 | "Has v_mad_mix_f32, v_mad_mixlo_f16, v_mad_mixhi_f16 instructions" |
| 116 | >; |
| 117 | |
| Marek Olsak | 0f55fba | 2016-12-09 19:49:54 +0000 | [diff] [blame] | 118 | // XNACK is disabled if SH_MEM_CONFIG.ADDRESS_MODE = GPUVM on chips that support |
| 119 | // XNACK. The current default kernel driver setting is: |
| 120 | // - graphics ring: XNACK disabled |
| 121 | // - compute ring: XNACK enabled |
| 122 | // |
| 123 | // If XNACK is enabled, the VMEM latency can be worse. |
| 124 | // If XNACK is disabled, the 2 SGPRs can be used for general purposes. |
| Nicolai Haehnle | 5b50497 | 2016-01-04 23:35:53 +0000 | [diff] [blame] | 125 | def FeatureXNACK : SubtargetFeature<"xnack", |
| Matt Arsenault | 382d945 | 2016-01-26 04:49:22 +0000 | [diff] [blame] | 126 | "EnableXNACK", |
| 127 | "true", |
| 128 | "Enable XNACK support" |
| 129 | >; |
| Tom Stellard | e99fb65 | 2015-01-20 19:33:04 +0000 | [diff] [blame] | 130 | |
| Marek Olsak | 4d00dd2 | 2015-03-09 15:48:09 +0000 | [diff] [blame] | 131 | def FeatureSGPRInitBug : SubtargetFeature<"sgpr-init-bug", |
| Matt Arsenault | 382d945 | 2016-01-26 04:49:22 +0000 | [diff] [blame] | 132 | "SGPRInitBug", |
| 133 | "true", |
| Matt Arsenault | a7eb14af | 2017-08-06 18:13:23 +0000 | [diff] [blame] | 134 | "VI SGPR initialization bug requiring a fixed SGPR allocation size" |
| Matt Arsenault | 382d945 | 2016-01-26 04:49:22 +0000 | [diff] [blame] | 135 | >; |
| Tom Stellard | de008d3 | 2016-01-21 04:28:34 +0000 | [diff] [blame] | 136 | |
| Tom Stellard | 3498e4f | 2013-06-07 20:28:55 +0000 | [diff] [blame] | 137 | class SubtargetFeatureFetchLimit <string Value> : |
| 138 | SubtargetFeature <"fetch"#Value, |
| Matt Arsenault | 382d945 | 2016-01-26 04:49:22 +0000 | [diff] [blame] | 139 | "TexVTXClauseSize", |
| 140 | Value, |
| 141 | "Limit the maximum number of fetches in a clause to "#Value |
| 142 | >; |
| Tom Stellard | 9979277 | 2013-06-07 20:28:49 +0000 | [diff] [blame] | 143 | |
| Tom Stellard | 3498e4f | 2013-06-07 20:28:55 +0000 | [diff] [blame] | 144 | def FeatureFetchLimit8 : SubtargetFeatureFetchLimit <"8">; |
| 145 | def FeatureFetchLimit16 : SubtargetFeatureFetchLimit <"16">; |
| 146 | |
| Tom Stellard | 8c347b0 | 2014-01-22 21:55:40 +0000 | [diff] [blame] | 147 | class SubtargetFeatureWavefrontSize <int Value> : SubtargetFeature< |
| Matt Arsenault | 382d945 | 2016-01-26 04:49:22 +0000 | [diff] [blame] | 148 | "wavefrontsize"#Value, |
| 149 | "WavefrontSize", |
| 150 | !cast<string>(Value), |
| 151 | "The number of threads per wavefront" |
| 152 | >; |
| Tom Stellard | 8c347b0 | 2014-01-22 21:55:40 +0000 | [diff] [blame] | 153 | |
| 154 | def FeatureWavefrontSize16 : SubtargetFeatureWavefrontSize<16>; |
| 155 | def FeatureWavefrontSize32 : SubtargetFeatureWavefrontSize<32>; |
| 156 | def FeatureWavefrontSize64 : SubtargetFeatureWavefrontSize<64>; |
| 157 | |
| Tom Stellard | ec87f84 | 2015-05-25 16:15:54 +0000 | [diff] [blame] | 158 | class SubtargetFeatureLDSBankCount <int Value> : SubtargetFeature < |
| Matt Arsenault | 382d945 | 2016-01-26 04:49:22 +0000 | [diff] [blame] | 159 | "ldsbankcount"#Value, |
| 160 | "LDSBankCount", |
| 161 | !cast<string>(Value), |
| 162 | "The number of LDS banks per compute unit." |
| 163 | >; |
| Tom Stellard | ec87f84 | 2015-05-25 16:15:54 +0000 | [diff] [blame] | 164 | |
| 165 | def FeatureLDSBankCount16 : SubtargetFeatureLDSBankCount<16>; |
| 166 | def FeatureLDSBankCount32 : SubtargetFeatureLDSBankCount<32>; |
| 167 | |
| Tom Stellard | 880a80a | 2014-06-17 16:53:14 +0000 | [diff] [blame] | 168 | class SubtargetFeatureLocalMemorySize <int Value> : SubtargetFeature< |
| Matt Arsenault | 382d945 | 2016-01-26 04:49:22 +0000 | [diff] [blame] | 169 | "localmemorysize"#Value, |
| 170 | "LocalMemorySize", |
| 171 | !cast<string>(Value), |
| 172 | "The size of local memory in bytes" |
| 173 | >; |
| Tom Stellard | 880a80a | 2014-06-17 16:53:14 +0000 | [diff] [blame] | 174 | |
| Tom Stellard | d7e6f13 | 2015-04-08 01:09:26 +0000 | [diff] [blame] | 175 | def FeatureGCN : SubtargetFeature<"gcn", |
| Matt Arsenault | 382d945 | 2016-01-26 04:49:22 +0000 | [diff] [blame] | 176 | "IsGCN", |
| 177 | "true", |
| 178 | "GCN or newer GPU" |
| 179 | >; |
| Tom Stellard | d7e6f13 | 2015-04-08 01:09:26 +0000 | [diff] [blame] | 180 | |
| Tom Stellard | d7e6f13 | 2015-04-08 01:09:26 +0000 | [diff] [blame] | 181 | def FeatureGCN3Encoding : SubtargetFeature<"gcn3-encoding", |
| Matt Arsenault | 382d945 | 2016-01-26 04:49:22 +0000 | [diff] [blame] | 182 | "GCN3Encoding", |
| 183 | "true", |
| 184 | "Encoding format for VI" |
| 185 | >; |
| Tom Stellard | d1f0f02 | 2015-04-23 19:33:54 +0000 | [diff] [blame] | 186 | |
| 187 | def FeatureCIInsts : SubtargetFeature<"ci-insts", |
| Matt Arsenault | 382d945 | 2016-01-26 04:49:22 +0000 | [diff] [blame] | 188 | "CIInsts", |
| 189 | "true", |
| Matt Arsenault | c6baa85 | 2017-10-02 20:31:18 +0000 | [diff] [blame] | 190 | "Additional instructions for CI+" |
| Matt Arsenault | 382d945 | 2016-01-26 04:49:22 +0000 | [diff] [blame] | 191 | >; |
| 192 | |
| Matt Arsenault | 2021f08 | 2017-02-18 19:12:26 +0000 | [diff] [blame] | 193 | def FeatureGFX9Insts : SubtargetFeature<"gfx9-insts", |
| 194 | "GFX9Insts", |
| 195 | "true", |
| Matt Arsenault | c6baa85 | 2017-10-02 20:31:18 +0000 | [diff] [blame] | 196 | "Additional instructions for GFX9+" |
| Matt Arsenault | 2021f08 | 2017-02-18 19:12:26 +0000 | [diff] [blame] | 197 | >; |
| 198 | |
| Matt Arsenault | 9d82ee7 | 2016-02-27 08:53:55 +0000 | [diff] [blame] | 199 | def FeatureSMemRealTime : SubtargetFeature<"s-memrealtime", |
| 200 | "HasSMemRealTime", |
| Matt Arsenault | 61738cb | 2016-02-27 08:53:46 +0000 | [diff] [blame] | 201 | "true", |
| Matt Arsenault | 9d82ee7 | 2016-02-27 08:53:55 +0000 | [diff] [blame] | 202 | "Has s_memrealtime instruction" |
| 203 | >; |
| 204 | |
| Matt Arsenault | c88ba36 | 2016-10-29 04:05:06 +0000 | [diff] [blame] | 205 | def FeatureInv2PiInlineImm : SubtargetFeature<"inv-2pi-inline-imm", |
| 206 | "HasInv2PiInlineImm", |
| 207 | "true", |
| 208 | "Has 1 / (2 * pi) as inline immediate" |
| 209 | >; |
| 210 | |
| Matt Arsenault | 9d82ee7 | 2016-02-27 08:53:55 +0000 | [diff] [blame] | 211 | def Feature16BitInsts : SubtargetFeature<"16-bit-insts", |
| 212 | "Has16BitInsts", |
| 213 | "true", |
| 214 | "Has i16/f16 instructions" |
| Matt Arsenault | 61738cb | 2016-02-27 08:53:46 +0000 | [diff] [blame] | 215 | >; |
| 216 | |
| Matt Arsenault | 9be7b0d | 2017-02-27 18:49:11 +0000 | [diff] [blame] | 217 | def FeatureVOP3P : SubtargetFeature<"vop3p", |
| 218 | "HasVOP3PInsts", |
| 219 | "true", |
| 220 | "Has VOP3P packed instructions" |
| 221 | >; |
| 222 | |
| Matt Arsenault | cc88ce3 | 2016-10-12 18:00:51 +0000 | [diff] [blame] | 223 | def FeatureMovrel : SubtargetFeature<"movrel", |
| 224 | "HasMovrel", |
| 225 | "true", |
| 226 | "Has v_movrel*_b32 instructions" |
| 227 | >; |
| 228 | |
| 229 | def FeatureVGPRIndexMode : SubtargetFeature<"vgpr-index-mode", |
| 230 | "HasVGPRIndexMode", |
| 231 | "true", |
| 232 | "Has VGPR mode register indexing" |
| 233 | >; |
| 234 | |
| Matt Arsenault | 7b64755 | 2016-10-28 21:55:15 +0000 | [diff] [blame] | 235 | def FeatureScalarStores : SubtargetFeature<"scalar-stores", |
| 236 | "HasScalarStores", |
| 237 | "true", |
| 238 | "Has store scalar memory instructions" |
| 239 | >; |
| 240 | |
| Sam Kolton | 07dbde2 | 2017-01-20 10:01:25 +0000 | [diff] [blame] | 241 | def FeatureSDWA : SubtargetFeature<"sdwa", |
| 242 | "HasSDWA", |
| 243 | "true", |
| 244 | "Support SDWA (Sub-DWORD Addressing) extension" |
| 245 | >; |
| 246 | |
| Sam Kolton | 3c4933f | 2017-06-22 06:26:41 +0000 | [diff] [blame] | 247 | def FeatureSDWAOmod : SubtargetFeature<"sdwa-omod", |
| 248 | "HasSDWAOmod", |
| 249 | "true", |
| 250 | "Support OMod with SDWA (Sub-DWORD Addressing) extension" |
| 251 | >; |
| 252 | |
| 253 | def FeatureSDWAScalar : SubtargetFeature<"sdwa-scalar", |
| 254 | "HasSDWAScalar", |
| 255 | "true", |
| 256 | "Support scalar register with SDWA (Sub-DWORD Addressing) extension" |
| 257 | >; |
| 258 | |
| 259 | def FeatureSDWASdst : SubtargetFeature<"sdwa-sdst", |
| 260 | "HasSDWASdst", |
| 261 | "true", |
| 262 | "Support scalar dst for VOPC with SDWA (Sub-DWORD Addressing) extension" |
| 263 | >; |
| 264 | |
| 265 | def FeatureSDWAMac : SubtargetFeature<"sdwa-mav", |
| 266 | "HasSDWAMac", |
| 267 | "true", |
| 268 | "Support v_mac_f32/f16 with SDWA (Sub-DWORD Addressing) extension" |
| 269 | >; |
| 270 | |
| Sam Kolton | a179d25 | 2017-06-27 15:02:23 +0000 | [diff] [blame] | 271 | def FeatureSDWAOutModsVOPC : SubtargetFeature<"sdwa-out-mods-vopc", |
| 272 | "HasSDWAOutModsVOPC", |
| Sam Kolton | 3c4933f | 2017-06-22 06:26:41 +0000 | [diff] [blame] | 273 | "true", |
| 274 | "Support clamp for VOPC with SDWA (Sub-DWORD Addressing) extension" |
| 275 | >; |
| 276 | |
| Sam Kolton | 07dbde2 | 2017-01-20 10:01:25 +0000 | [diff] [blame] | 277 | def FeatureDPP : SubtargetFeature<"dpp", |
| 278 | "HasDPP", |
| 279 | "true", |
| 280 | "Support DPP (Data Parallel Primitives) extension" |
| 281 | >; |
| 282 | |
| Dmitry Preobrazhensky | ff64aa5 | 2017-08-16 13:51:56 +0000 | [diff] [blame] | 283 | def FeatureIntClamp : SubtargetFeature<"int-clamp-insts", |
| 284 | "HasIntClamp", |
| 285 | "true", |
| 286 | "Support clamp for integer destination" |
| 287 | >; |
| 288 | |
| Matt Arsenault | 382d945 | 2016-01-26 04:49:22 +0000 | [diff] [blame] | 289 | //===------------------------------------------------------------===// |
| 290 | // Subtarget Features (options and debugging) |
| 291 | //===------------------------------------------------------------===// |
| 292 | |
| 293 | // Some instructions do not support denormals despite this flag. Using |
| 294 | // fp32 denormals also causes instructions to run at the double |
| 295 | // precision rate for the device. |
| 296 | def FeatureFP32Denormals : SubtargetFeature<"fp32-denormals", |
| 297 | "FP32Denormals", |
| 298 | "true", |
| 299 | "Enable single precision denormal handling" |
| 300 | >; |
| 301 | |
| Matt Arsenault | a6867fd | 2017-01-23 22:31:03 +0000 | [diff] [blame] | 302 | // Denormal handling for fp64 and fp16 is controlled by the same |
| 303 | // config register when fp16 supported. |
| 304 | // TODO: Do we need a separate f16 setting when not legal? |
| 305 | def FeatureFP64FP16Denormals : SubtargetFeature<"fp64-fp16-denormals", |
| 306 | "FP64FP16Denormals", |
| Matt Arsenault | 382d945 | 2016-01-26 04:49:22 +0000 | [diff] [blame] | 307 | "true", |
| Matt Arsenault | a6867fd | 2017-01-23 22:31:03 +0000 | [diff] [blame] | 308 | "Enable double and half precision denormal handling", |
| Matt Arsenault | 382d945 | 2016-01-26 04:49:22 +0000 | [diff] [blame] | 309 | [FeatureFP64] |
| 310 | >; |
| 311 | |
| Matt Arsenault | a6867fd | 2017-01-23 22:31:03 +0000 | [diff] [blame] | 312 | def FeatureFP64Denormals : SubtargetFeature<"fp64-denormals", |
| 313 | "FP64FP16Denormals", |
| 314 | "true", |
| 315 | "Enable double and half precision denormal handling", |
| 316 | [FeatureFP64, FeatureFP64FP16Denormals] |
| 317 | >; |
| 318 | |
| 319 | def FeatureFP16Denormals : SubtargetFeature<"fp16-denormals", |
| 320 | "FP64FP16Denormals", |
| 321 | "true", |
| 322 | "Enable half precision denormal handling", |
| 323 | [FeatureFP64FP16Denormals] |
| 324 | >; |
| 325 | |
| Matt Arsenault | 2fdf2a1 | 2017-02-21 23:35:48 +0000 | [diff] [blame] | 326 | def FeatureDX10Clamp : SubtargetFeature<"dx10-clamp", |
| 327 | "DX10Clamp", |
| 328 | "true", |
| 329 | "clamp modifier clamps NaNs to 0.0" |
| 330 | >; |
| 331 | |
| Matt Arsenault | f639c32 | 2016-01-28 20:53:42 +0000 | [diff] [blame] | 332 | def FeatureFPExceptions : SubtargetFeature<"fp-exceptions", |
| 333 | "FPExceptions", |
| 334 | "true", |
| 335 | "Enable floating point exceptions" |
| 336 | >; |
| 337 | |
| Matt Arsenault | 24ee078 | 2016-02-12 02:40:47 +0000 | [diff] [blame] | 338 | class FeatureMaxPrivateElementSize<int size> : SubtargetFeature< |
| 339 | "max-private-element-size-"#size, |
| 340 | "MaxPrivateElementSize", |
| 341 | !cast<string>(size), |
| 342 | "Maximum private access size may be "#size |
| 343 | >; |
| 344 | |
| 345 | def FeatureMaxPrivateElementSize4 : FeatureMaxPrivateElementSize<4>; |
| 346 | def FeatureMaxPrivateElementSize8 : FeatureMaxPrivateElementSize<8>; |
| 347 | def FeatureMaxPrivateElementSize16 : FeatureMaxPrivateElementSize<16>; |
| 348 | |
| Matt Arsenault | 382d945 | 2016-01-26 04:49:22 +0000 | [diff] [blame] | 349 | def FeatureVGPRSpilling : SubtargetFeature<"vgpr-spilling", |
| 350 | "EnableVGPRSpilling", |
| 351 | "true", |
| 352 | "Enable spilling of VGPRs to scratch memory" |
| 353 | >; |
| 354 | |
| 355 | def FeatureDumpCode : SubtargetFeature <"DumpCode", |
| 356 | "DumpCode", |
| 357 | "true", |
| 358 | "Dump MachineInstrs in the CodeEmitter" |
| 359 | >; |
| 360 | |
| 361 | def FeatureDumpCodeLower : SubtargetFeature <"dumpcode", |
| 362 | "DumpCode", |
| 363 | "true", |
| 364 | "Dump MachineInstrs in the CodeEmitter" |
| 365 | >; |
| 366 | |
| Matt Arsenault | 382d945 | 2016-01-26 04:49:22 +0000 | [diff] [blame] | 367 | def FeaturePromoteAlloca : SubtargetFeature <"promote-alloca", |
| 368 | "EnablePromoteAlloca", |
| 369 | "true", |
| 370 | "Enable promote alloca pass" |
| 371 | >; |
| 372 | |
| 373 | // XXX - This should probably be removed once enabled by default |
| 374 | def FeatureEnableLoadStoreOpt : SubtargetFeature <"load-store-opt", |
| 375 | "EnableLoadStoreOpt", |
| 376 | "true", |
| 377 | "Enable SI load/store optimizer pass" |
| 378 | >; |
| 379 | |
| 380 | // Performance debugging feature. Allow using DS instruction immediate |
| 381 | // offsets even if the base pointer can't be proven to be base. On SI, |
| 382 | // base pointer values that won't give the same result as a 16-bit add |
| 383 | // are not safe to fold, but this will override the conservative test |
| 384 | // for the base pointer. |
| 385 | def FeatureEnableUnsafeDSOffsetFolding : SubtargetFeature < |
| 386 | "unsafe-ds-offset-folding", |
| 387 | "EnableUnsafeDSOffsetFolding", |
| 388 | "true", |
| 389 | "Force using DS instruction immediate offsets on SI" |
| 390 | >; |
| 391 | |
| Matt Arsenault | 382d945 | 2016-01-26 04:49:22 +0000 | [diff] [blame] | 392 | def FeatureEnableSIScheduler : SubtargetFeature<"si-scheduler", |
| 393 | "EnableSIScheduler", |
| 394 | "true", |
| 395 | "Enable SI Machine Scheduler" |
| 396 | >; |
| 397 | |
| Matt Arsenault | 7aad8fd | 2017-01-24 22:02:15 +0000 | [diff] [blame] | 398 | // Unless +-flat-for-global is specified, turn on FlatForGlobal for |
| 399 | // all OS-es on VI and newer hardware to avoid assertion failures due |
| 400 | // to missing ADDR64 variants of MUBUF instructions. |
| 401 | // FIXME: moveToVALU should be able to handle converting addr64 MUBUF |
| 402 | // instructions. |
| 403 | |
| Matt Arsenault | 382d945 | 2016-01-26 04:49:22 +0000 | [diff] [blame] | 404 | def FeatureFlatForGlobal : SubtargetFeature<"flat-for-global", |
| 405 | "FlatForGlobal", |
| 406 | "true", |
| Matt Arsenault | d8f7ea3 | 2017-01-27 17:42:26 +0000 | [diff] [blame] | 407 | "Force to generate flat instruction for global" |
| Matt Arsenault | 382d945 | 2016-01-26 04:49:22 +0000 | [diff] [blame] | 408 | >; |
| Tom Stellard | d1f0f02 | 2015-04-23 19:33:54 +0000 | [diff] [blame] | 409 | |
| Konstantin Zhuravlyov | be6c0ca | 2017-06-02 17:40:26 +0000 | [diff] [blame] | 410 | def FeatureAutoWaitcntBeforeBarrier : SubtargetFeature < |
| 411 | "auto-waitcnt-before-barrier", |
| 412 | "AutoWaitcntBeforeBarrier", |
| 413 | "true", |
| 414 | "Hardware automatically inserts waitcnt before barrier" |
| 415 | >; |
| 416 | |
| Konstantin Zhuravlyov | eda425e | 2017-10-14 15:59:07 +0000 | [diff] [blame] | 417 | def FeatureCodeObjectV3 : SubtargetFeature < |
| 418 | "code-object-v3", |
| 419 | "CodeObjectV3", |
| 420 | "true", |
| 421 | "Generate code object version 3" |
| 422 | >; |
| 423 | |
| Tom Stellard | d1f0f02 | 2015-04-23 19:33:54 +0000 | [diff] [blame] | 424 | // Dummy feature used to disable assembler instructions. |
| 425 | def FeatureDisable : SubtargetFeature<"", |
| Matt Arsenault | 382d945 | 2016-01-26 04:49:22 +0000 | [diff] [blame] | 426 | "FeatureDisable","true", |
| 427 | "Dummy feature to disable assembler instructions" |
| 428 | >; |
| Tom Stellard | d1f0f02 | 2015-04-23 19:33:54 +0000 | [diff] [blame] | 429 | |
| Tom Stellard | a6c6e1b | 2013-06-07 20:37:48 +0000 | [diff] [blame] | 430 | class SubtargetFeatureGeneration <string Value, |
| 431 | list<SubtargetFeature> Implies> : |
| 432 | SubtargetFeature <Value, "Gen", "AMDGPUSubtarget::"#Value, |
| 433 | Value#" GPU generation", Implies>; |
| 434 | |
| Tom Stellard | 880a80a | 2014-06-17 16:53:14 +0000 | [diff] [blame] | 435 | def FeatureLocalMemorySize0 : SubtargetFeatureLocalMemorySize<0>; |
| 436 | def FeatureLocalMemorySize32768 : SubtargetFeatureLocalMemorySize<32768>; |
| 437 | def FeatureLocalMemorySize65536 : SubtargetFeatureLocalMemorySize<65536>; |
| 438 | |
| Tom Stellard | a6c6e1b | 2013-06-07 20:37:48 +0000 | [diff] [blame] | 439 | def FeatureR600 : SubtargetFeatureGeneration<"R600", |
| Matt Arsenault | 382d945 | 2016-01-26 04:49:22 +0000 | [diff] [blame] | 440 | [FeatureR600ALUInst, FeatureFetchLimit8, FeatureLocalMemorySize0] |
| 441 | >; |
| Tom Stellard | a6c6e1b | 2013-06-07 20:37:48 +0000 | [diff] [blame] | 442 | |
| 443 | def FeatureR700 : SubtargetFeatureGeneration<"R700", |
| Matt Arsenault | 382d945 | 2016-01-26 04:49:22 +0000 | [diff] [blame] | 444 | [FeatureFetchLimit16, FeatureLocalMemorySize0] |
| 445 | >; |
| Tom Stellard | a6c6e1b | 2013-06-07 20:37:48 +0000 | [diff] [blame] | 446 | |
| 447 | def FeatureEvergreen : SubtargetFeatureGeneration<"EVERGREEN", |
| Matt Arsenault | 382d945 | 2016-01-26 04:49:22 +0000 | [diff] [blame] | 448 | [FeatureFetchLimit16, FeatureLocalMemorySize32768] |
| 449 | >; |
| Tom Stellard | a6c6e1b | 2013-06-07 20:37:48 +0000 | [diff] [blame] | 450 | |
| 451 | def FeatureNorthernIslands : SubtargetFeatureGeneration<"NORTHERN_ISLANDS", |
| Matt Arsenault | 382d945 | 2016-01-26 04:49:22 +0000 | [diff] [blame] | 452 | [FeatureFetchLimit16, FeatureWavefrontSize64, |
| 453 | FeatureLocalMemorySize32768] |
| Tom Stellard | 880a80a | 2014-06-17 16:53:14 +0000 | [diff] [blame] | 454 | >; |
| Tom Stellard | a6c6e1b | 2013-06-07 20:37:48 +0000 | [diff] [blame] | 455 | |
| 456 | def FeatureSouthernIslands : SubtargetFeatureGeneration<"SOUTHERN_ISLANDS", |
| Matt Arsenault | 382d945 | 2016-01-26 04:49:22 +0000 | [diff] [blame] | 457 | [FeatureFP64, FeatureLocalMemorySize32768, |
| Matt Arsenault | 8728c5f | 2017-08-07 14:58:04 +0000 | [diff] [blame] | 458 | FeatureWavefrontSize64, FeatureGCN, |
| Matt Arsenault | cc88ce3 | 2016-10-12 18:00:51 +0000 | [diff] [blame] | 459 | FeatureLDSBankCount32, FeatureMovrel] |
| Matt Arsenault | 382d945 | 2016-01-26 04:49:22 +0000 | [diff] [blame] | 460 | >; |
| Tom Stellard | a6c6e1b | 2013-06-07 20:37:48 +0000 | [diff] [blame] | 461 | |
| Tom Stellard | 6e1ee47 | 2013-10-29 16:37:28 +0000 | [diff] [blame] | 462 | def FeatureSeaIslands : SubtargetFeatureGeneration<"SEA_ISLANDS", |
| Matt Arsenault | 382d945 | 2016-01-26 04:49:22 +0000 | [diff] [blame] | 463 | [FeatureFP64, FeatureLocalMemorySize65536, |
| 464 | FeatureWavefrontSize64, FeatureGCN, FeatureFlatAddressSpace, |
| Matt Arsenault | 8728c5f | 2017-08-07 14:58:04 +0000 | [diff] [blame] | 465 | FeatureCIInsts, FeatureMovrel] |
| Matt Arsenault | 382d945 | 2016-01-26 04:49:22 +0000 | [diff] [blame] | 466 | >; |
| Marek Olsak | 5df00d6 | 2014-12-07 12:18:57 +0000 | [diff] [blame] | 467 | |
| 468 | def FeatureVolcanicIslands : SubtargetFeatureGeneration<"VOLCANIC_ISLANDS", |
| Matt Arsenault | 382d945 | 2016-01-26 04:49:22 +0000 | [diff] [blame] | 469 | [FeatureFP64, FeatureLocalMemorySize65536, |
| 470 | FeatureWavefrontSize64, FeatureFlatAddressSpace, FeatureGCN, |
| Matt Arsenault | 9d82ee7 | 2016-02-27 08:53:55 +0000 | [diff] [blame] | 471 | FeatureGCN3Encoding, FeatureCIInsts, Feature16BitInsts, |
| Matt Arsenault | 7b64755 | 2016-10-28 21:55:15 +0000 | [diff] [blame] | 472 | FeatureSMemRealTime, FeatureVGPRIndexMode, FeatureMovrel, |
| Sam Kolton | 3c4933f | 2017-06-22 06:26:41 +0000 | [diff] [blame] | 473 | FeatureScalarStores, FeatureInv2PiInlineImm, |
| Dmitry Preobrazhensky | ff64aa5 | 2017-08-16 13:51:56 +0000 | [diff] [blame] | 474 | FeatureSDWA, FeatureSDWAOutModsVOPC, FeatureSDWAMac, FeatureDPP, |
| 475 | FeatureIntClamp |
| Matt Arsenault | 9d82ee7 | 2016-02-27 08:53:55 +0000 | [diff] [blame] | 476 | ] |
| Matt Arsenault | 382d945 | 2016-01-26 04:49:22 +0000 | [diff] [blame] | 477 | >; |
| Marek Olsak | 5df00d6 | 2014-12-07 12:18:57 +0000 | [diff] [blame] | 478 | |
| Matt Arsenault | e823d92 | 2017-02-18 18:29:53 +0000 | [diff] [blame] | 479 | def FeatureGFX9 : SubtargetFeatureGeneration<"GFX9", |
| 480 | [FeatureFP64, FeatureLocalMemorySize65536, |
| 481 | FeatureWavefrontSize64, FeatureFlatAddressSpace, FeatureGCN, |
| 482 | FeatureGCN3Encoding, FeatureCIInsts, Feature16BitInsts, |
| 483 | FeatureSMemRealTime, FeatureScalarStores, FeatureInv2PiInlineImm, |
| Konstantin Zhuravlyov | f628406 | 2017-04-21 19:57:53 +0000 | [diff] [blame] | 484 | FeatureApertureRegs, FeatureGFX9Insts, FeatureVOP3P, FeatureVGPRIndexMode, |
| Dmitry Preobrazhensky | ff64aa5 | 2017-08-16 13:51:56 +0000 | [diff] [blame] | 485 | FeatureFastFMAF32, FeatureDPP, FeatureIntClamp, |
| Sam Kolton | 3c4933f | 2017-06-22 06:26:41 +0000 | [diff] [blame] | 486 | FeatureSDWA, FeatureSDWAOmod, FeatureSDWAScalar, FeatureSDWASdst, |
| Matt Arsenault | c37fe66 | 2017-07-20 17:42:47 +0000 | [diff] [blame] | 487 | FeatureFlatInstOffsets, FeatureFlatGlobalInsts, FeatureFlatScratchInsts, |
| 488 | FeatureAddNoCarryInsts |
| Matt Arsenault | e823d92 | 2017-02-18 18:29:53 +0000 | [diff] [blame] | 489 | ] |
| 490 | >; |
| 491 | |
| Yaxun Liu | 94add85 | 2016-10-26 16:37:56 +0000 | [diff] [blame] | 492 | class SubtargetFeatureISAVersion <int Major, int Minor, int Stepping, |
| 493 | list<SubtargetFeature> Implies> |
| 494 | : SubtargetFeature < |
| 495 | "isaver"#Major#"."#Minor#"."#Stepping, |
| 496 | "IsaVersion", |
| 497 | "ISAVersion"#Major#"_"#Minor#"_"#Stepping, |
| 498 | "Instruction set version number", |
| 499 | Implies |
| 500 | >; |
| 501 | |
| Wei Ding | 7c3e511 | 2017-06-10 03:53:19 +0000 | [diff] [blame] | 502 | def FeatureISAVersion6_0_0 : SubtargetFeatureISAVersion <6,0,0, |
| 503 | [FeatureSouthernIslands, |
| Matt Arsenault | 8bcf2f2 | 2017-06-26 03:01:36 +0000 | [diff] [blame] | 504 | FeatureFastFMAF32, |
| Wei Ding | 7c3e511 | 2017-06-10 03:53:19 +0000 | [diff] [blame] | 505 | HalfRate64Ops, |
| 506 | FeatureLDSBankCount32]>; |
| 507 | |
| 508 | def FeatureISAVersion6_0_1 : SubtargetFeatureISAVersion <6,0,1, |
| 509 | [FeatureSouthernIslands, |
| 510 | FeatureLDSBankCount32]>; |
| Matt Arsenault | 8bcf2f2 | 2017-06-26 03:01:36 +0000 | [diff] [blame] | 511 | |
| Matt Arsenault | f3dd863 | 2016-11-01 00:55:14 +0000 | [diff] [blame] | 512 | def FeatureISAVersion7_0_0 : SubtargetFeatureISAVersion <7,0,0, |
| Yaxun Liu | 94add85 | 2016-10-26 16:37:56 +0000 | [diff] [blame] | 513 | [FeatureSeaIslands, |
| 514 | FeatureLDSBankCount32]>; |
| Matt Arsenault | f3dd863 | 2016-11-01 00:55:14 +0000 | [diff] [blame] | 515 | |
| Yaxun Liu | 94add85 | 2016-10-26 16:37:56 +0000 | [diff] [blame] | 516 | def FeatureISAVersion7_0_1 : SubtargetFeatureISAVersion <7,0,1, |
| 517 | [FeatureSeaIslands, |
| 518 | HalfRate64Ops, |
| 519 | FeatureLDSBankCount32, |
| 520 | FeatureFastFMAF32]>; |
| Matt Arsenault | f3dd863 | 2016-11-01 00:55:14 +0000 | [diff] [blame] | 521 | |
| Yaxun Liu | 94add85 | 2016-10-26 16:37:56 +0000 | [diff] [blame] | 522 | def FeatureISAVersion7_0_2 : SubtargetFeatureISAVersion <7,0,2, |
| 523 | [FeatureSeaIslands, |
| Marek Olsak | 23ae31c | 2016-12-09 19:49:58 +0000 | [diff] [blame] | 524 | FeatureLDSBankCount16]>; |
| Matt Arsenault | f3dd863 | 2016-11-01 00:55:14 +0000 | [diff] [blame] | 525 | |
| Wei Ding | 7c3e511 | 2017-06-10 03:53:19 +0000 | [diff] [blame] | 526 | def FeatureISAVersion7_0_3 : SubtargetFeatureISAVersion <7,0,3, |
| 527 | [FeatureSeaIslands, |
| 528 | FeatureLDSBankCount16]>; |
| 529 | |
| Yaxun Liu | 94add85 | 2016-10-26 16:37:56 +0000 | [diff] [blame] | 530 | def FeatureISAVersion8_0_0 : SubtargetFeatureISAVersion <8,0,0, |
| 531 | [FeatureVolcanicIslands, |
| 532 | FeatureLDSBankCount32, |
| 533 | FeatureSGPRInitBug]>; |
| Matt Arsenault | f3dd863 | 2016-11-01 00:55:14 +0000 | [diff] [blame] | 534 | |
| Yaxun Liu | 94add85 | 2016-10-26 16:37:56 +0000 | [diff] [blame] | 535 | def FeatureISAVersion8_0_1 : SubtargetFeatureISAVersion <8,0,1, |
| 536 | [FeatureVolcanicIslands, |
| Konstantin Zhuravlyov | 6810765 | 2017-08-24 20:03:07 +0000 | [diff] [blame] | 537 | FeatureFastFMAF32, |
| 538 | HalfRate64Ops, |
| Yaxun Liu | 94add85 | 2016-10-26 16:37:56 +0000 | [diff] [blame] | 539 | FeatureLDSBankCount32, |
| 540 | FeatureXNACK]>; |
| Matt Arsenault | f3dd863 | 2016-11-01 00:55:14 +0000 | [diff] [blame] | 541 | |
| Yaxun Liu | 94add85 | 2016-10-26 16:37:56 +0000 | [diff] [blame] | 542 | def FeatureISAVersion8_0_2 : SubtargetFeatureISAVersion <8,0,2, |
| 543 | [FeatureVolcanicIslands, |
| 544 | FeatureLDSBankCount32, |
| 545 | FeatureSGPRInitBug]>; |
| Matt Arsenault | f3dd863 | 2016-11-01 00:55:14 +0000 | [diff] [blame] | 546 | |
| Yaxun Liu | 94add85 | 2016-10-26 16:37:56 +0000 | [diff] [blame] | 547 | def FeatureISAVersion8_0_3 : SubtargetFeatureISAVersion <8,0,3, |
| 548 | [FeatureVolcanicIslands, |
| 549 | FeatureLDSBankCount32]>; |
| Matt Arsenault | f3dd863 | 2016-11-01 00:55:14 +0000 | [diff] [blame] | 550 | |
| Yaxun Liu | 94add85 | 2016-10-26 16:37:56 +0000 | [diff] [blame] | 551 | def FeatureISAVersion8_0_4 : SubtargetFeatureISAVersion <8,0,4, |
| 552 | [FeatureVolcanicIslands, |
| 553 | FeatureLDSBankCount32]>; |
| Matt Arsenault | f3dd863 | 2016-11-01 00:55:14 +0000 | [diff] [blame] | 554 | |
| Yaxun Liu | 94add85 | 2016-10-26 16:37:56 +0000 | [diff] [blame] | 555 | def FeatureISAVersion8_1_0 : SubtargetFeatureISAVersion <8,1,0, |
| 556 | [FeatureVolcanicIslands, |
| 557 | FeatureLDSBankCount16, |
| 558 | FeatureXNACK]>; |
| 559 | |
| Wei Ding | 7c3e511 | 2017-06-10 03:53:19 +0000 | [diff] [blame] | 560 | def FeatureISAVersion9_0_0 : SubtargetFeatureISAVersion <9,0,0, |
| 561 | [FeatureGFX9, |
| Matt Arsenault | 28f52e5 | 2017-10-25 07:00:51 +0000 | [diff] [blame] | 562 | FeatureMadMixInsts, |
| 563 | FeatureLDSBankCount32 |
| 564 | ]>; |
| Wei Ding | 7c3e511 | 2017-06-10 03:53:19 +0000 | [diff] [blame] | 565 | |
| 566 | def FeatureISAVersion9_0_1 : SubtargetFeatureISAVersion <9,0,1, |
| 567 | [FeatureGFX9, |
| Matt Arsenault | 28f52e5 | 2017-10-25 07:00:51 +0000 | [diff] [blame] | 568 | FeatureMadMixInsts, |
| Wei Ding | 7c3e511 | 2017-06-10 03:53:19 +0000 | [diff] [blame] | 569 | FeatureLDSBankCount32, |
| 570 | FeatureXNACK]>; |
| 571 | |
| 572 | def FeatureISAVersion9_0_2 : SubtargetFeatureISAVersion <9,0,2, |
| 573 | [FeatureGFX9, |
| Matt Arsenault | 28f52e5 | 2017-10-25 07:00:51 +0000 | [diff] [blame] | 574 | FeatureMadMixInsts, |
| 575 | FeatureLDSBankCount32 |
| 576 | ]>; |
| Wei Ding | 7c3e511 | 2017-06-10 03:53:19 +0000 | [diff] [blame] | 577 | |
| 578 | def FeatureISAVersion9_0_3 : SubtargetFeatureISAVersion <9,0,3, |
| 579 | [FeatureGFX9, |
| Matt Arsenault | 28f52e5 | 2017-10-25 07:00:51 +0000 | [diff] [blame] | 580 | FeatureMadMixInsts, |
| Wei Ding | 7c3e511 | 2017-06-10 03:53:19 +0000 | [diff] [blame] | 581 | FeatureLDSBankCount32, |
| 582 | FeatureXNACK]>; |
| Matt Arsenault | e823d92 | 2017-02-18 18:29:53 +0000 | [diff] [blame] | 583 | |
| Tom Stellard | 3498e4f | 2013-06-07 20:28:55 +0000 | [diff] [blame] | 584 | //===----------------------------------------------------------------------===// |
| Konstantin Zhuravlyov | 8c273ad | 2016-04-18 16:28:23 +0000 | [diff] [blame] | 585 | // Debugger related subtarget features. |
| 586 | //===----------------------------------------------------------------------===// |
| 587 | |
| 588 | def FeatureDebuggerInsertNops : SubtargetFeature< |
| 589 | "amdgpu-debugger-insert-nops", |
| 590 | "DebuggerInsertNops", |
| 591 | "true", |
| Konstantin Zhuravlyov | e3d322a | 2016-05-13 18:21:28 +0000 | [diff] [blame] | 592 | "Insert one nop instruction for each high level source statement" |
| Konstantin Zhuravlyov | 8c273ad | 2016-04-18 16:28:23 +0000 | [diff] [blame] | 593 | >; |
| 594 | |
| Konstantin Zhuravlyov | 29ddd2b | 2016-05-24 18:37:18 +0000 | [diff] [blame] | 595 | def FeatureDebuggerReserveRegs : SubtargetFeature< |
| 596 | "amdgpu-debugger-reserve-regs", |
| 597 | "DebuggerReserveRegs", |
| Konstantin Zhuravlyov | 1d99c4d | 2016-04-26 15:43:14 +0000 | [diff] [blame] | 598 | "true", |
| Konstantin Zhuravlyov | 29ddd2b | 2016-05-24 18:37:18 +0000 | [diff] [blame] | 599 | "Reserve registers for debugger usage" |
| Konstantin Zhuravlyov | 1d99c4d | 2016-04-26 15:43:14 +0000 | [diff] [blame] | 600 | >; |
| 601 | |
| Konstantin Zhuravlyov | f2f3d14 | 2016-06-25 03:11:28 +0000 | [diff] [blame] | 602 | def FeatureDebuggerEmitPrologue : SubtargetFeature< |
| 603 | "amdgpu-debugger-emit-prologue", |
| 604 | "DebuggerEmitPrologue", |
| 605 | "true", |
| 606 | "Emit debugger prologue" |
| 607 | >; |
| 608 | |
| Konstantin Zhuravlyov | 8c273ad | 2016-04-18 16:28:23 +0000 | [diff] [blame] | 609 | //===----------------------------------------------------------------------===// |
| Tom Stellard | 75aadc2 | 2012-12-11 21:25:42 +0000 | [diff] [blame] | 610 | |
| 611 | def AMDGPUInstrInfo : InstrInfo { |
| 612 | let guessInstructionProperties = 1; |
| Matt Arsenault | 1ecac06 | 2015-02-18 02:15:32 +0000 | [diff] [blame] | 613 | let noNamedPositionallyEncodedOperands = 1; |
| Tom Stellard | 75aadc2 | 2012-12-11 21:25:42 +0000 | [diff] [blame] | 614 | } |
| 615 | |
| Tom Stellard | 9d7ddd5 | 2014-11-14 14:08:00 +0000 | [diff] [blame] | 616 | def AMDGPUAsmParser : AsmParser { |
| 617 | // Some of the R600 registers have the same name, so this crashes. |
| 618 | // For example T0_XYZW and T0_XY both have the asm name T0. |
| 619 | let ShouldEmitMatchRegisterName = 0; |
| 620 | } |
| 621 | |
| Konstantin Zhuravlyov | da4687c | 2016-09-27 14:42:48 +0000 | [diff] [blame] | 622 | def AMDGPUAsmWriter : AsmWriter { |
| 623 | int PassSubtarget = 1; |
| 624 | } |
| 625 | |
| Sam Kolton | d63d8a7 | 2016-09-09 09:37:51 +0000 | [diff] [blame] | 626 | def AMDGPUAsmVariants { |
| 627 | string Default = "Default"; |
| 628 | int Default_ID = 0; |
| 629 | string VOP3 = "VOP3"; |
| 630 | int VOP3_ID = 1; |
| 631 | string SDWA = "SDWA"; |
| 632 | int SDWA_ID = 2; |
| Sam Kolton | f7659d71 | 2017-05-23 10:08:55 +0000 | [diff] [blame] | 633 | string SDWA9 = "SDWA9"; |
| 634 | int SDWA9_ID = 3; |
| Sam Kolton | d63d8a7 | 2016-09-09 09:37:51 +0000 | [diff] [blame] | 635 | string DPP = "DPP"; |
| Sam Kolton | f7659d71 | 2017-05-23 10:08:55 +0000 | [diff] [blame] | 636 | int DPP_ID = 4; |
| Sam Kolton | fb0d9d9 | 2016-09-12 14:42:43 +0000 | [diff] [blame] | 637 | string Disable = "Disable"; |
| Sam Kolton | f7659d71 | 2017-05-23 10:08:55 +0000 | [diff] [blame] | 638 | int Disable_ID = 5; |
| Sam Kolton | d63d8a7 | 2016-09-09 09:37:51 +0000 | [diff] [blame] | 639 | } |
| 640 | |
| 641 | def DefaultAMDGPUAsmParserVariant : AsmParserVariant { |
| 642 | let Variant = AMDGPUAsmVariants.Default_ID; |
| 643 | let Name = AMDGPUAsmVariants.Default; |
| 644 | } |
| 645 | |
| 646 | def VOP3AsmParserVariant : AsmParserVariant { |
| 647 | let Variant = AMDGPUAsmVariants.VOP3_ID; |
| 648 | let Name = AMDGPUAsmVariants.VOP3; |
| 649 | } |
| 650 | |
| 651 | def SDWAAsmParserVariant : AsmParserVariant { |
| 652 | let Variant = AMDGPUAsmVariants.SDWA_ID; |
| 653 | let Name = AMDGPUAsmVariants.SDWA; |
| 654 | } |
| 655 | |
| Sam Kolton | f7659d71 | 2017-05-23 10:08:55 +0000 | [diff] [blame] | 656 | def SDWA9AsmParserVariant : AsmParserVariant { |
| 657 | let Variant = AMDGPUAsmVariants.SDWA9_ID; |
| 658 | let Name = AMDGPUAsmVariants.SDWA9; |
| 659 | } |
| 660 | |
| 661 | |
| Sam Kolton | d63d8a7 | 2016-09-09 09:37:51 +0000 | [diff] [blame] | 662 | def DPPAsmParserVariant : AsmParserVariant { |
| 663 | let Variant = AMDGPUAsmVariants.DPP_ID; |
| 664 | let Name = AMDGPUAsmVariants.DPP; |
| 665 | } |
| 666 | |
| Tom Stellard | 75aadc2 | 2012-12-11 21:25:42 +0000 | [diff] [blame] | 667 | def AMDGPU : Target { |
| 668 | // Pull in Instruction Info: |
| 669 | let InstructionSet = AMDGPUInstrInfo; |
| Tom Stellard | 9d7ddd5 | 2014-11-14 14:08:00 +0000 | [diff] [blame] | 670 | let AssemblyParsers = [AMDGPUAsmParser]; |
| Sam Kolton | d63d8a7 | 2016-09-09 09:37:51 +0000 | [diff] [blame] | 671 | let AssemblyParserVariants = [DefaultAMDGPUAsmParserVariant, |
| 672 | VOP3AsmParserVariant, |
| 673 | SDWAAsmParserVariant, |
| Sam Kolton | f7659d71 | 2017-05-23 10:08:55 +0000 | [diff] [blame] | 674 | SDWA9AsmParserVariant, |
| Sam Kolton | d63d8a7 | 2016-09-09 09:37:51 +0000 | [diff] [blame] | 675 | DPPAsmParserVariant]; |
| Konstantin Zhuravlyov | da4687c | 2016-09-27 14:42:48 +0000 | [diff] [blame] | 676 | let AssemblyWriters = [AMDGPUAsmWriter]; |
| Tom Stellard | 75aadc2 | 2012-12-11 21:25:42 +0000 | [diff] [blame] | 677 | } |
| 678 | |
| Tom Stellard | bc5b537 | 2014-06-13 16:38:59 +0000 | [diff] [blame] | 679 | // Dummy Instruction itineraries for pseudo instructions |
| 680 | def ALU_NULL : FuncUnit; |
| 681 | def NullALU : InstrItinClass; |
| 682 | |
| Tom Stellard | 0e70de5 | 2014-05-16 20:56:45 +0000 | [diff] [blame] | 683 | //===----------------------------------------------------------------------===// |
| 684 | // Predicate helper class |
| 685 | //===----------------------------------------------------------------------===// |
| 686 | |
| Tom Stellard | d1f0f02 | 2015-04-23 19:33:54 +0000 | [diff] [blame] | 687 | def TruePredicate : Predicate<"true">; |
| Matt Arsenault | 382d945 | 2016-01-26 04:49:22 +0000 | [diff] [blame] | 688 | |
| Tom Stellard | d1f0f02 | 2015-04-23 19:33:54 +0000 | [diff] [blame] | 689 | def isSICI : Predicate< |
| 690 | "Subtarget->getGeneration() == AMDGPUSubtarget::SOUTHERN_ISLANDS ||" |
| 691 | "Subtarget->getGeneration() == AMDGPUSubtarget::SEA_ISLANDS" |
| Matt Arsenault | 8728c5f | 2017-08-07 14:58:04 +0000 | [diff] [blame] | 692 | >, AssemblerPredicate<"!FeatureGCN3Encoding">; |
| Tom Stellard | d1f0f02 | 2015-04-23 19:33:54 +0000 | [diff] [blame] | 693 | |
| Tom Stellard | 5ebdfbe | 2015-12-24 03:18:18 +0000 | [diff] [blame] | 694 | def isVI : Predicate < |
| 695 | "Subtarget->getGeneration() >= AMDGPUSubtarget::VOLCANIC_ISLANDS">, |
| 696 | AssemblerPredicate<"FeatureGCN3Encoding">; |
| 697 | |
| Matt Arsenault | 2021f08 | 2017-02-18 19:12:26 +0000 | [diff] [blame] | 698 | def isGFX9 : Predicate < |
| 699 | "Subtarget->getGeneration() >= AMDGPUSubtarget::GFX9">, |
| 700 | AssemblerPredicate<"FeatureGFX9Insts">; |
| 701 | |
| Matt Arsenault | e823d92 | 2017-02-18 18:29:53 +0000 | [diff] [blame] | 702 | // TODO: Either the name to be changed or we simply use IsCI! |
| Matt Arsenault | 382d945 | 2016-01-26 04:49:22 +0000 | [diff] [blame] | 703 | def isCIVI : Predicate < |
| Matt Arsenault | e823d92 | 2017-02-18 18:29:53 +0000 | [diff] [blame] | 704 | "Subtarget->getGeneration() >= AMDGPUSubtarget::SEA_ISLANDS">, |
| 705 | AssemblerPredicate<"FeatureCIInsts">; |
| Matt Arsenault | 382d945 | 2016-01-26 04:49:22 +0000 | [diff] [blame] | 706 | |
| Matt Arsenault | 9698f1c | 2017-06-20 19:54:14 +0000 | [diff] [blame] | 707 | def HasFlatAddressSpace : Predicate<"Subtarget->hasFlatAddressSpace()">, |
| 708 | AssemblerPredicate<"FeatureFlatAddressSpace">; |
| 709 | |
| 710 | def HasFlatGlobalInsts : Predicate<"Subtarget->hasFlatGlobalInsts()">, |
| 711 | AssemblerPredicate<"FeatureFlatGlobalInsts">; |
| Matt Arsenault | ca7b0a1 | 2017-07-21 15:36:16 +0000 | [diff] [blame] | 712 | def HasFlatScratchInsts : Predicate<"Subtarget->hasFlatScratchInsts()">, |
| 713 | AssemblerPredicate<"FeatureFlatScratchInsts">; |
| Matt Arsenault | ed6e8f0 | 2017-09-01 18:36:06 +0000 | [diff] [blame] | 714 | def HasD16LoadStore : Predicate<"Subtarget->hasD16LoadStore()">, |
| 715 | AssemblerPredicate<"FeatureGFX9Insts">; |
| Matt Arsenault | 382d945 | 2016-01-26 04:49:22 +0000 | [diff] [blame] | 716 | |
| Matt Arsenault | efa1d65 | 2017-09-01 18:38:02 +0000 | [diff] [blame] | 717 | def HasDSAddTid : Predicate<"Subtarget->getGeneration() >= AMDGPUSubtarget::GFX9">, |
| 718 | AssemblerPredicate<"FeatureGFX9Insts">; |
| 719 | |
| Matt Arsenault | c37fe66 | 2017-07-20 17:42:47 +0000 | [diff] [blame] | 720 | def HasAddNoCarryInsts : Predicate<"Subtarget->hasAddNoCarryInsts()">, |
| 721 | AssemblerPredicate<"FeatureAddNoCarryInsts">; |
| 722 | |
| 723 | def NotHasAddNoCarryInsts : Predicate<"!Subtarget->hasAddNoCarryInsts()">, |
| 724 | AssemblerPredicate<"!FeatureAddNoCarryInsts">; |
| 725 | |
| Matt Arsenault | 9be7b0d | 2017-02-27 18:49:11 +0000 | [diff] [blame] | 726 | def Has16BitInsts : Predicate<"Subtarget->has16BitInsts()">, |
| 727 | AssemblerPredicate<"Feature16BitInsts">; |
| 728 | def HasVOP3PInsts : Predicate<"Subtarget->hasVOP3PInsts()">, |
| 729 | AssemblerPredicate<"FeatureVOP3P">; |
| Tom Stellard | 115a615 | 2016-11-10 16:02:37 +0000 | [diff] [blame] | 730 | |
| Sam Kolton | 07dbde2 | 2017-01-20 10:01:25 +0000 | [diff] [blame] | 731 | def HasSDWA : Predicate<"Subtarget->hasSDWA()">, |
| Sam Kolton | f7659d71 | 2017-05-23 10:08:55 +0000 | [diff] [blame] | 732 | AssemblerPredicate<"FeatureSDWA,FeatureVolcanicIslands">; |
| 733 | |
| 734 | def HasSDWA9 : Predicate<"Subtarget->hasSDWA()">, |
| 735 | AssemblerPredicate<"FeatureSDWA,FeatureGFX9">; |
| Sam Kolton | 07dbde2 | 2017-01-20 10:01:25 +0000 | [diff] [blame] | 736 | |
| 737 | def HasDPP : Predicate<"Subtarget->hasDPP()">, |
| 738 | AssemblerPredicate<"FeatureDPP">; |
| 739 | |
| Dmitry Preobrazhensky | ff64aa5 | 2017-08-16 13:51:56 +0000 | [diff] [blame] | 740 | def HasIntClamp : Predicate<"Subtarget->hasIntClamp()">, |
| 741 | AssemblerPredicate<"FeatureIntClamp">; |
| 742 | |
| Matt Arsenault | 28f52e5 | 2017-10-25 07:00:51 +0000 | [diff] [blame] | 743 | def HasMadMixInsts : Predicate<"Subtarget->hasMadMixInsts()">, |
| 744 | AssemblerPredicate<"FeatureMadMixInsts">; |
| Matt Arsenault | d7e2303 | 2017-09-07 18:05:07 +0000 | [diff] [blame] | 745 | |
| Matt Arsenault | cc85223 | 2017-10-10 20:22:07 +0000 | [diff] [blame] | 746 | def EnableLateCFGStructurize : Predicate< |
| 747 | "EnableLateStructurizeCFG">; |
| Matt Arsenault | 90c7593 | 2017-10-03 00:06:41 +0000 | [diff] [blame] | 748 | |
| 749 | // Exists to help track down where SubtargetPredicate isn't set rather |
| 750 | // than letting tablegen crash with an unhelpful error. |
| 751 | def InvalidPred : Predicate<"predicate not set on instruction or pattern">; |
| 752 | |
| Tom Stellard | 0e70de5 | 2014-05-16 20:56:45 +0000 | [diff] [blame] | 753 | class PredicateControl { |
| Matt Arsenault | 90c7593 | 2017-10-03 00:06:41 +0000 | [diff] [blame] | 754 | Predicate SubtargetPredicate = InvalidPred; |
| Tom Stellard | d1f0f02 | 2015-04-23 19:33:54 +0000 | [diff] [blame] | 755 | Predicate SIAssemblerPredicate = isSICI; |
| Tom Stellard | 5ebdfbe | 2015-12-24 03:18:18 +0000 | [diff] [blame] | 756 | Predicate VIAssemblerPredicate = isVI; |
| Tom Stellard | d7e6f13 | 2015-04-08 01:09:26 +0000 | [diff] [blame] | 757 | list<Predicate> AssemblerPredicates = []; |
| Tom Stellard | d1f0f02 | 2015-04-23 19:33:54 +0000 | [diff] [blame] | 758 | Predicate AssemblerPredicate = TruePredicate; |
| Tom Stellard | 0e70de5 | 2014-05-16 20:56:45 +0000 | [diff] [blame] | 759 | list<Predicate> OtherPredicates = []; |
| Matt Arsenault | 90c7593 | 2017-10-03 00:06:41 +0000 | [diff] [blame] | 760 | list<Predicate> Predicates = !listconcat([SubtargetPredicate, |
| 761 | AssemblerPredicate], |
| Tom Stellard | d7e6f13 | 2015-04-08 01:09:26 +0000 | [diff] [blame] | 762 | AssemblerPredicates, |
| Tom Stellard | 0e70de5 | 2014-05-16 20:56:45 +0000 | [diff] [blame] | 763 | OtherPredicates); |
| 764 | } |
| 765 | |
| Matt Arsenault | 90c7593 | 2017-10-03 00:06:41 +0000 | [diff] [blame] | 766 | class AMDGPUPat<dag pattern, dag result> : Pat<pattern, result>, |
| 767 | PredicateControl; |
| 768 | |
| 769 | |
| Tom Stellard | 75aadc2 | 2012-12-11 21:25:42 +0000 | [diff] [blame] | 770 | // Include AMDGPU TD files |
| 771 | include "R600Schedule.td" |
| Konstantin Zhuravlyov | 27b0a03 | 2017-11-10 20:01:58 +0000 | [diff] [blame^] | 772 | include "R600Processors.td" |
| Tom Stellard | 75aadc2 | 2012-12-11 21:25:42 +0000 | [diff] [blame] | 773 | include "SISchedule.td" |
| Konstantin Zhuravlyov | 27b0a03 | 2017-11-10 20:01:58 +0000 | [diff] [blame^] | 774 | include "GCNProcessors.td" |
| Tom Stellard | 75aadc2 | 2012-12-11 21:25:42 +0000 | [diff] [blame] | 775 | include "AMDGPUInstrInfo.td" |
| 776 | include "AMDGPUIntrinsics.td" |
| 777 | include "AMDGPURegisterInfo.td" |
| Tom Stellard | ca16621 | 2017-01-30 21:56:46 +0000 | [diff] [blame] | 778 | include "AMDGPURegisterBanks.td" |
| Tom Stellard | 75aadc2 | 2012-12-11 21:25:42 +0000 | [diff] [blame] | 779 | include "AMDGPUInstructions.td" |
| Christian Konig | 2c8f6d5 | 2013-03-07 09:03:52 +0000 | [diff] [blame] | 780 | include "AMDGPUCallingConv.td" |