| Matt Arsenault | 382d945 | 2016-01-26 04:49:22 +0000 | [diff] [blame] | 1 | //===-- AMDGPU.td - AMDGPU Tablegen files --------*- tablegen -*-===// | 
| Tom Stellard | 75aadc2 | 2012-12-11 21:25:42 +0000 | [diff] [blame] | 2 | // | 
|  | 3 | //                     The LLVM Compiler Infrastructure | 
|  | 4 | // | 
|  | 5 | // This file is distributed under the University of Illinois Open Source | 
|  | 6 | // License. See LICENSE.TXT for details. | 
|  | 7 | // | 
| Matt Arsenault | 382d945 | 2016-01-26 04:49:22 +0000 | [diff] [blame] | 8 | //===------------------------------------------------------------===// | 
| Tom Stellard | 75aadc2 | 2012-12-11 21:25:42 +0000 | [diff] [blame] | 9 |  | 
| Tom Stellard | bc5b537 | 2014-06-13 16:38:59 +0000 | [diff] [blame] | 10 | include "llvm/Target/Target.td" | 
| Tom Stellard | 75aadc2 | 2012-12-11 21:25:42 +0000 | [diff] [blame] | 11 |  | 
| Matt Arsenault | 382d945 | 2016-01-26 04:49:22 +0000 | [diff] [blame] | 12 | //===------------------------------------------------------------===// | 
|  | 13 | // Subtarget Features (device properties) | 
|  | 14 | //===------------------------------------------------------------===// | 
| Tom Stellard | 783893a | 2013-11-18 19:43:33 +0000 | [diff] [blame] | 15 |  | 
| Matt Arsenault | f5e2997 | 2014-06-20 06:50:05 +0000 | [diff] [blame] | 16 | def FeatureFP64 : SubtargetFeature<"fp64", | 
| Matt Arsenault | 382d945 | 2016-01-26 04:49:22 +0000 | [diff] [blame] | 17 | "FP64", | 
|  | 18 | "true", | 
|  | 19 | "Enable double precision operations" | 
|  | 20 | >; | 
| Matt Arsenault | f171cf2 | 2014-07-14 23:40:49 +0000 | [diff] [blame] | 21 |  | 
| Jan Vesely | 39aeab4 | 2017-12-04 23:07:28 +0000 | [diff] [blame] | 22 | def FeatureFMA : SubtargetFeature<"fmaf", | 
|  | 23 | "FMA", | 
|  | 24 | "true", | 
|  | 25 | "Enable single precision FMA (not as fast as mul+add, but fused)" | 
|  | 26 | >; | 
|  | 27 |  | 
| Matt Arsenault | b035a57 | 2015-01-29 19:34:25 +0000 | [diff] [blame] | 28 | def FeatureFastFMAF32 : SubtargetFeature<"fast-fmaf", | 
| Matt Arsenault | 382d945 | 2016-01-26 04:49:22 +0000 | [diff] [blame] | 29 | "FastFMAF32", | 
|  | 30 | "true", | 
|  | 31 | "Assuming f32 fma is at least as fast as mul + add" | 
|  | 32 | >; | 
| Matt Arsenault | b035a57 | 2015-01-29 19:34:25 +0000 | [diff] [blame] | 33 |  | 
| Dmitry Preobrazhensky | e3271ae | 2018-02-05 12:45:43 +0000 | [diff] [blame] | 34 | def FeatureMIMG_R128 : SubtargetFeature<"mimg-r128", | 
|  | 35 | "MIMG_R128", | 
|  | 36 | "true", | 
|  | 37 | "Support 128-bit texture resources" | 
|  | 38 | >; | 
|  | 39 |  | 
| Matt Arsenault | e83690c | 2016-01-18 21:13:50 +0000 | [diff] [blame] | 40 | def HalfRate64Ops : SubtargetFeature<"half-rate-64-ops", | 
| Matt Arsenault | 382d945 | 2016-01-26 04:49:22 +0000 | [diff] [blame] | 41 | "HalfRate64Ops", | 
|  | 42 | "true", | 
|  | 43 | "Most fp64 instructions are half rate instead of quarter" | 
|  | 44 | >; | 
| Matt Arsenault | f171cf2 | 2014-07-14 23:40:49 +0000 | [diff] [blame] | 45 |  | 
| Tom Stellard | 9979277 | 2013-06-07 20:28:49 +0000 | [diff] [blame] | 46 | def FeatureR600ALUInst : SubtargetFeature<"R600ALUInst", | 
| Matt Arsenault | 382d945 | 2016-01-26 04:49:22 +0000 | [diff] [blame] | 47 | "R600ALUInst", | 
|  | 48 | "false", | 
|  | 49 | "Older version of ALU instructions encoding" | 
|  | 50 | >; | 
| Tom Stellard | 9979277 | 2013-06-07 20:28:49 +0000 | [diff] [blame] | 51 |  | 
|  | 52 | def FeatureVertexCache : SubtargetFeature<"HasVertexCache", | 
| Matt Arsenault | 382d945 | 2016-01-26 04:49:22 +0000 | [diff] [blame] | 53 | "HasVertexCache", | 
|  | 54 | "true", | 
|  | 55 | "Specify use of dedicated vertex cache" | 
|  | 56 | >; | 
| Tom Stellard | 9979277 | 2013-06-07 20:28:49 +0000 | [diff] [blame] | 57 |  | 
| Tom Stellard | a6c6e1b | 2013-06-07 20:37:48 +0000 | [diff] [blame] | 58 | def FeatureCaymanISA : SubtargetFeature<"caymanISA", | 
| Matt Arsenault | 382d945 | 2016-01-26 04:49:22 +0000 | [diff] [blame] | 59 | "CaymanISA", | 
|  | 60 | "true", | 
|  | 61 | "Use Cayman ISA" | 
|  | 62 | >; | 
| Tom Stellard | a6c6e1b | 2013-06-07 20:37:48 +0000 | [diff] [blame] | 63 |  | 
| Tom Stellard | 348273d | 2014-01-23 16:18:02 +0000 | [diff] [blame] | 64 | def FeatureCFALUBug : SubtargetFeature<"cfalubug", | 
| Matt Arsenault | 382d945 | 2016-01-26 04:49:22 +0000 | [diff] [blame] | 65 | "CFALUBug", | 
|  | 66 | "true", | 
|  | 67 | "GPU has CF_ALU bug" | 
|  | 68 | >; | 
| Changpeng Fang | b41574a | 2015-12-22 20:55:23 +0000 | [diff] [blame] | 69 |  | 
| Matt Arsenault | 3f98140 | 2014-09-15 15:41:53 +0000 | [diff] [blame] | 70 | def FeatureFlatAddressSpace : SubtargetFeature<"flat-address-space", | 
| Matt Arsenault | 382d945 | 2016-01-26 04:49:22 +0000 | [diff] [blame] | 71 | "FlatAddressSpace", | 
|  | 72 | "true", | 
|  | 73 | "Support flat address space" | 
|  | 74 | >; | 
| Matt Arsenault | 3f98140 | 2014-09-15 15:41:53 +0000 | [diff] [blame] | 75 |  | 
| Matt Arsenault | acdc765 | 2017-05-10 21:19:05 +0000 | [diff] [blame] | 76 | def FeatureFlatInstOffsets : SubtargetFeature<"flat-inst-offsets", | 
|  | 77 | "FlatInstOffsets", | 
|  | 78 | "true", | 
|  | 79 | "Flat instructions have immediate offset addressing mode" | 
|  | 80 | >; | 
|  | 81 |  | 
|  | 82 | def FeatureFlatGlobalInsts : SubtargetFeature<"flat-global-insts", | 
|  | 83 | "FlatGlobalInsts", | 
|  | 84 | "true", | 
|  | 85 | "Have global_* flat memory instructions" | 
|  | 86 | >; | 
|  | 87 |  | 
|  | 88 | def FeatureFlatScratchInsts : SubtargetFeature<"flat-scratch-insts", | 
|  | 89 | "FlatScratchInsts", | 
|  | 90 | "true", | 
|  | 91 | "Have scratch_* flat memory instructions" | 
|  | 92 | >; | 
|  | 93 |  | 
| Matt Arsenault | c37fe66 | 2017-07-20 17:42:47 +0000 | [diff] [blame] | 94 | def FeatureAddNoCarryInsts : SubtargetFeature<"add-no-carry-insts", | 
|  | 95 | "AddNoCarryInsts", | 
|  | 96 | "true", | 
|  | 97 | "Have VALU add/sub instructions without carry out" | 
|  | 98 | >; | 
|  | 99 |  | 
| Matt Arsenault | 7f681ac | 2016-07-01 23:03:44 +0000 | [diff] [blame] | 100 | def FeatureUnalignedBufferAccess : SubtargetFeature<"unaligned-buffer-access", | 
|  | 101 | "UnalignedBufferAccess", | 
|  | 102 | "true", | 
|  | 103 | "Support unaligned global loads and stores" | 
|  | 104 | >; | 
|  | 105 |  | 
| Wei Ding | 205bfdb | 2017-02-10 02:15:29 +0000 | [diff] [blame] | 106 | def FeatureTrapHandler: SubtargetFeature<"trap-handler", | 
|  | 107 | "TrapHandler", | 
|  | 108 | "true", | 
|  | 109 | "Trap handler support" | 
|  | 110 | >; | 
|  | 111 |  | 
| Tom Stellard | 64a9d08 | 2016-10-14 18:10:39 +0000 | [diff] [blame] | 112 | def FeatureUnalignedScratchAccess : SubtargetFeature<"unaligned-scratch-access", | 
|  | 113 | "UnalignedScratchAccess", | 
|  | 114 | "true", | 
|  | 115 | "Support unaligned scratch loads and stores" | 
|  | 116 | >; | 
|  | 117 |  | 
| Matt Arsenault | e823d92 | 2017-02-18 18:29:53 +0000 | [diff] [blame] | 118 | def FeatureApertureRegs : SubtargetFeature<"aperture-regs", | 
|  | 119 | "HasApertureRegs", | 
|  | 120 | "true", | 
|  | 121 | "Has Memory Aperture Base and Size Registers" | 
|  | 122 | >; | 
|  | 123 |  | 
| Matt Arsenault | 28f52e5 | 2017-10-25 07:00:51 +0000 | [diff] [blame] | 124 | def FeatureMadMixInsts : SubtargetFeature<"mad-mix-insts", | 
|  | 125 | "HasMadMixInsts", | 
|  | 126 | "true", | 
|  | 127 | "Has v_mad_mix_f32, v_mad_mixlo_f16, v_mad_mixhi_f16 instructions" | 
|  | 128 | >; | 
|  | 129 |  | 
| Matt Arsenault | 0084adc | 2018-04-30 19:08:16 +0000 | [diff] [blame] | 130 | def FeatureFmaMixInsts : SubtargetFeature<"fma-mix-insts", | 
|  | 131 | "HasFmaMixInsts", | 
|  | 132 | "true", | 
|  | 133 | "Has v_fma_mix_f32, v_fma_mixlo_f16, v_fma_mixhi_f16 instructions" | 
|  | 134 | >; | 
|  | 135 |  | 
| Marek Olsak | 0f55fba | 2016-12-09 19:49:54 +0000 | [diff] [blame] | 136 | // XNACK is disabled if SH_MEM_CONFIG.ADDRESS_MODE = GPUVM on chips that support | 
|  | 137 | // XNACK. The current default kernel driver setting is: | 
|  | 138 | // - graphics ring: XNACK disabled | 
|  | 139 | // - compute ring: XNACK enabled | 
|  | 140 | // | 
|  | 141 | // If XNACK is enabled, the VMEM latency can be worse. | 
|  | 142 | // If XNACK is disabled, the 2 SGPRs can be used for general purposes. | 
| Nicolai Haehnle | 5b50497 | 2016-01-04 23:35:53 +0000 | [diff] [blame] | 143 | def FeatureXNACK : SubtargetFeature<"xnack", | 
| Matt Arsenault | 382d945 | 2016-01-26 04:49:22 +0000 | [diff] [blame] | 144 | "EnableXNACK", | 
|  | 145 | "true", | 
|  | 146 | "Enable XNACK support" | 
|  | 147 | >; | 
| Tom Stellard | e99fb65 | 2015-01-20 19:33:04 +0000 | [diff] [blame] | 148 |  | 
| Marek Olsak | 4d00dd2 | 2015-03-09 15:48:09 +0000 | [diff] [blame] | 149 | def FeatureSGPRInitBug : SubtargetFeature<"sgpr-init-bug", | 
| Matt Arsenault | 382d945 | 2016-01-26 04:49:22 +0000 | [diff] [blame] | 150 | "SGPRInitBug", | 
|  | 151 | "true", | 
| Matt Arsenault | a7eb14af | 2017-08-06 18:13:23 +0000 | [diff] [blame] | 152 | "VI SGPR initialization bug requiring a fixed SGPR allocation size" | 
| Matt Arsenault | 382d945 | 2016-01-26 04:49:22 +0000 | [diff] [blame] | 153 | >; | 
| Tom Stellard | de008d3 | 2016-01-21 04:28:34 +0000 | [diff] [blame] | 154 |  | 
| Tom Stellard | 3498e4f | 2013-06-07 20:28:55 +0000 | [diff] [blame] | 155 | class SubtargetFeatureFetchLimit <string Value> : | 
|  | 156 | SubtargetFeature <"fetch"#Value, | 
| Matt Arsenault | 382d945 | 2016-01-26 04:49:22 +0000 | [diff] [blame] | 157 | "TexVTXClauseSize", | 
|  | 158 | Value, | 
|  | 159 | "Limit the maximum number of fetches in a clause to "#Value | 
|  | 160 | >; | 
| Tom Stellard | 9979277 | 2013-06-07 20:28:49 +0000 | [diff] [blame] | 161 |  | 
| Tom Stellard | 3498e4f | 2013-06-07 20:28:55 +0000 | [diff] [blame] | 162 | def FeatureFetchLimit8 : SubtargetFeatureFetchLimit <"8">; | 
|  | 163 | def FeatureFetchLimit16 : SubtargetFeatureFetchLimit <"16">; | 
|  | 164 |  | 
| Tom Stellard | 8c347b0 | 2014-01-22 21:55:40 +0000 | [diff] [blame] | 165 | class SubtargetFeatureWavefrontSize <int Value> : SubtargetFeature< | 
| Matt Arsenault | 382d945 | 2016-01-26 04:49:22 +0000 | [diff] [blame] | 166 | "wavefrontsize"#Value, | 
|  | 167 | "WavefrontSize", | 
|  | 168 | !cast<string>(Value), | 
|  | 169 | "The number of threads per wavefront" | 
|  | 170 | >; | 
| Tom Stellard | 8c347b0 | 2014-01-22 21:55:40 +0000 | [diff] [blame] | 171 |  | 
|  | 172 | def FeatureWavefrontSize16 : SubtargetFeatureWavefrontSize<16>; | 
|  | 173 | def FeatureWavefrontSize32 : SubtargetFeatureWavefrontSize<32>; | 
|  | 174 | def FeatureWavefrontSize64 : SubtargetFeatureWavefrontSize<64>; | 
|  | 175 |  | 
| Tom Stellard | ec87f84 | 2015-05-25 16:15:54 +0000 | [diff] [blame] | 176 | class SubtargetFeatureLDSBankCount <int Value> : SubtargetFeature < | 
| Matt Arsenault | 382d945 | 2016-01-26 04:49:22 +0000 | [diff] [blame] | 177 | "ldsbankcount"#Value, | 
|  | 178 | "LDSBankCount", | 
|  | 179 | !cast<string>(Value), | 
|  | 180 | "The number of LDS banks per compute unit." | 
|  | 181 | >; | 
| Tom Stellard | ec87f84 | 2015-05-25 16:15:54 +0000 | [diff] [blame] | 182 |  | 
|  | 183 | def FeatureLDSBankCount16 : SubtargetFeatureLDSBankCount<16>; | 
|  | 184 | def FeatureLDSBankCount32 : SubtargetFeatureLDSBankCount<32>; | 
|  | 185 |  | 
| Tom Stellard | 880a80a | 2014-06-17 16:53:14 +0000 | [diff] [blame] | 186 | class SubtargetFeatureLocalMemorySize <int Value> : SubtargetFeature< | 
| Matt Arsenault | 382d945 | 2016-01-26 04:49:22 +0000 | [diff] [blame] | 187 | "localmemorysize"#Value, | 
|  | 188 | "LocalMemorySize", | 
|  | 189 | !cast<string>(Value), | 
|  | 190 | "The size of local memory in bytes" | 
|  | 191 | >; | 
| Tom Stellard | 880a80a | 2014-06-17 16:53:14 +0000 | [diff] [blame] | 192 |  | 
| Tom Stellard | d7e6f13 | 2015-04-08 01:09:26 +0000 | [diff] [blame] | 193 | def FeatureGCN : SubtargetFeature<"gcn", | 
| Matt Arsenault | 382d945 | 2016-01-26 04:49:22 +0000 | [diff] [blame] | 194 | "IsGCN", | 
|  | 195 | "true", | 
|  | 196 | "GCN or newer GPU" | 
|  | 197 | >; | 
| Tom Stellard | d7e6f13 | 2015-04-08 01:09:26 +0000 | [diff] [blame] | 198 |  | 
| Tom Stellard | d7e6f13 | 2015-04-08 01:09:26 +0000 | [diff] [blame] | 199 | def FeatureGCN3Encoding : SubtargetFeature<"gcn3-encoding", | 
| Matt Arsenault | 382d945 | 2016-01-26 04:49:22 +0000 | [diff] [blame] | 200 | "GCN3Encoding", | 
|  | 201 | "true", | 
|  | 202 | "Encoding format for VI" | 
|  | 203 | >; | 
| Tom Stellard | d1f0f02 | 2015-04-23 19:33:54 +0000 | [diff] [blame] | 204 |  | 
|  | 205 | def FeatureCIInsts : SubtargetFeature<"ci-insts", | 
| Matt Arsenault | 382d945 | 2016-01-26 04:49:22 +0000 | [diff] [blame] | 206 | "CIInsts", | 
|  | 207 | "true", | 
| Matt Arsenault | c6baa85 | 2017-10-02 20:31:18 +0000 | [diff] [blame] | 208 | "Additional instructions for CI+" | 
| Matt Arsenault | 382d945 | 2016-01-26 04:49:22 +0000 | [diff] [blame] | 209 | >; | 
|  | 210 |  | 
| Matt Arsenault | 2021f08 | 2017-02-18 19:12:26 +0000 | [diff] [blame] | 211 | def FeatureGFX9Insts : SubtargetFeature<"gfx9-insts", | 
|  | 212 | "GFX9Insts", | 
|  | 213 | "true", | 
| Matt Arsenault | c6baa85 | 2017-10-02 20:31:18 +0000 | [diff] [blame] | 214 | "Additional instructions for GFX9+" | 
| Matt Arsenault | 2021f08 | 2017-02-18 19:12:26 +0000 | [diff] [blame] | 215 | >; | 
|  | 216 |  | 
| Matt Arsenault | 9d82ee7 | 2016-02-27 08:53:55 +0000 | [diff] [blame] | 217 | def FeatureSMemRealTime : SubtargetFeature<"s-memrealtime", | 
|  | 218 | "HasSMemRealTime", | 
| Matt Arsenault | 61738cb | 2016-02-27 08:53:46 +0000 | [diff] [blame] | 219 | "true", | 
| Matt Arsenault | 9d82ee7 | 2016-02-27 08:53:55 +0000 | [diff] [blame] | 220 | "Has s_memrealtime instruction" | 
|  | 221 | >; | 
|  | 222 |  | 
| Matt Arsenault | c88ba36 | 2016-10-29 04:05:06 +0000 | [diff] [blame] | 223 | def FeatureInv2PiInlineImm : SubtargetFeature<"inv-2pi-inline-imm", | 
|  | 224 | "HasInv2PiInlineImm", | 
|  | 225 | "true", | 
|  | 226 | "Has 1 / (2 * pi) as inline immediate" | 
|  | 227 | >; | 
|  | 228 |  | 
| Matt Arsenault | 9d82ee7 | 2016-02-27 08:53:55 +0000 | [diff] [blame] | 229 | def Feature16BitInsts : SubtargetFeature<"16-bit-insts", | 
|  | 230 | "Has16BitInsts", | 
|  | 231 | "true", | 
|  | 232 | "Has i16/f16 instructions" | 
| Matt Arsenault | 61738cb | 2016-02-27 08:53:46 +0000 | [diff] [blame] | 233 | >; | 
|  | 234 |  | 
| Matt Arsenault | 9be7b0d | 2017-02-27 18:49:11 +0000 | [diff] [blame] | 235 | def FeatureVOP3P : SubtargetFeature<"vop3p", | 
|  | 236 | "HasVOP3PInsts", | 
|  | 237 | "true", | 
|  | 238 | "Has VOP3P packed instructions" | 
|  | 239 | >; | 
|  | 240 |  | 
| Matt Arsenault | cc88ce3 | 2016-10-12 18:00:51 +0000 | [diff] [blame] | 241 | def FeatureMovrel : SubtargetFeature<"movrel", | 
|  | 242 | "HasMovrel", | 
|  | 243 | "true", | 
|  | 244 | "Has v_movrel*_b32 instructions" | 
|  | 245 | >; | 
|  | 246 |  | 
|  | 247 | def FeatureVGPRIndexMode : SubtargetFeature<"vgpr-index-mode", | 
|  | 248 | "HasVGPRIndexMode", | 
|  | 249 | "true", | 
|  | 250 | "Has VGPR mode register indexing" | 
|  | 251 | >; | 
|  | 252 |  | 
| Matt Arsenault | 7b64755 | 2016-10-28 21:55:15 +0000 | [diff] [blame] | 253 | def FeatureScalarStores : SubtargetFeature<"scalar-stores", | 
|  | 254 | "HasScalarStores", | 
|  | 255 | "true", | 
|  | 256 | "Has store scalar memory instructions" | 
|  | 257 | >; | 
|  | 258 |  | 
| Dmitry Preobrazhensky | 6bad04e | 2018-04-02 16:10:25 +0000 | [diff] [blame] | 259 | def FeatureScalarAtomics : SubtargetFeature<"scalar-atomics", | 
|  | 260 | "HasScalarAtomics", | 
|  | 261 | "true", | 
|  | 262 | "Has atomic scalar memory instructions" | 
|  | 263 | >; | 
|  | 264 |  | 
| Sam Kolton | 07dbde2 | 2017-01-20 10:01:25 +0000 | [diff] [blame] | 265 | def FeatureSDWA : SubtargetFeature<"sdwa", | 
|  | 266 | "HasSDWA", | 
|  | 267 | "true", | 
|  | 268 | "Support SDWA (Sub-DWORD Addressing) extension" | 
|  | 269 | >; | 
|  | 270 |  | 
| Sam Kolton | 3c4933f | 2017-06-22 06:26:41 +0000 | [diff] [blame] | 271 | def FeatureSDWAOmod : SubtargetFeature<"sdwa-omod", | 
|  | 272 | "HasSDWAOmod", | 
|  | 273 | "true", | 
|  | 274 | "Support OMod with SDWA (Sub-DWORD Addressing) extension" | 
|  | 275 | >; | 
|  | 276 |  | 
|  | 277 | def FeatureSDWAScalar : SubtargetFeature<"sdwa-scalar", | 
|  | 278 | "HasSDWAScalar", | 
|  | 279 | "true", | 
|  | 280 | "Support scalar register with SDWA (Sub-DWORD Addressing) extension" | 
|  | 281 | >; | 
|  | 282 |  | 
|  | 283 | def FeatureSDWASdst : SubtargetFeature<"sdwa-sdst", | 
|  | 284 | "HasSDWASdst", | 
|  | 285 | "true", | 
|  | 286 | "Support scalar dst for VOPC with SDWA (Sub-DWORD Addressing) extension" | 
|  | 287 | >; | 
|  | 288 |  | 
|  | 289 | def FeatureSDWAMac : SubtargetFeature<"sdwa-mav", | 
|  | 290 | "HasSDWAMac", | 
|  | 291 | "true", | 
|  | 292 | "Support v_mac_f32/f16 with SDWA (Sub-DWORD Addressing) extension" | 
|  | 293 | >; | 
|  | 294 |  | 
| Sam Kolton | a179d25 | 2017-06-27 15:02:23 +0000 | [diff] [blame] | 295 | def FeatureSDWAOutModsVOPC : SubtargetFeature<"sdwa-out-mods-vopc", | 
|  | 296 | "HasSDWAOutModsVOPC", | 
| Sam Kolton | 3c4933f | 2017-06-22 06:26:41 +0000 | [diff] [blame] | 297 | "true", | 
|  | 298 | "Support clamp for VOPC with SDWA (Sub-DWORD Addressing) extension" | 
|  | 299 | >; | 
|  | 300 |  | 
| Sam Kolton | 07dbde2 | 2017-01-20 10:01:25 +0000 | [diff] [blame] | 301 | def FeatureDPP : SubtargetFeature<"dpp", | 
|  | 302 | "HasDPP", | 
|  | 303 | "true", | 
|  | 304 | "Support DPP (Data Parallel Primitives) extension" | 
|  | 305 | >; | 
|  | 306 |  | 
| Dmitry Preobrazhensky | ff64aa5 | 2017-08-16 13:51:56 +0000 | [diff] [blame] | 307 | def FeatureIntClamp : SubtargetFeature<"int-clamp-insts", | 
|  | 308 | "HasIntClamp", | 
|  | 309 | "true", | 
|  | 310 | "Support clamp for integer destination" | 
|  | 311 | >; | 
|  | 312 |  | 
| Changpeng Fang | 44dfa1d | 2018-01-12 21:12:19 +0000 | [diff] [blame] | 313 | def FeatureUnpackedD16VMem : SubtargetFeature<"unpacked-d16-vmem", | 
|  | 314 | "HasUnpackedD16VMem", | 
|  | 315 | "true", | 
|  | 316 | "Has unpacked d16 vmem instructions" | 
|  | 317 | >; | 
|  | 318 |  | 
| Matt Arsenault | 0084adc | 2018-04-30 19:08:16 +0000 | [diff] [blame] | 319 | def FeatureDLInsts : SubtargetFeature<"dl-insts", | 
|  | 320 | "HasDLInsts", | 
|  | 321 | "true", | 
|  | 322 | "Has deep learning instructions" | 
|  | 323 | >; | 
|  | 324 |  | 
| Konstantin Zhuravlyov | c2c2eb7 | 2018-05-04 20:06:57 +0000 | [diff] [blame] | 325 | def FeatureD16PreservesUnusedBits : SubtargetFeature< | 
|  | 326 | "d16-preserves-unused-bits", | 
|  | 327 | "D16PreservesUnusedBits", | 
|  | 328 | "true", | 
|  | 329 | "D16 memory instructions preserve unused bits rather than zeroing them out" | 
|  | 330 | >; | 
|  | 331 |  | 
| Matt Arsenault | 382d945 | 2016-01-26 04:49:22 +0000 | [diff] [blame] | 332 | //===------------------------------------------------------------===// | 
|  | 333 | // Subtarget Features (options and debugging) | 
|  | 334 | //===------------------------------------------------------------===// | 
|  | 335 |  | 
|  | 336 | // Some instructions do not support denormals despite this flag. Using | 
|  | 337 | // fp32 denormals also causes instructions to run at the double | 
|  | 338 | // precision rate for the device. | 
|  | 339 | def FeatureFP32Denormals : SubtargetFeature<"fp32-denormals", | 
|  | 340 | "FP32Denormals", | 
|  | 341 | "true", | 
|  | 342 | "Enable single precision denormal handling" | 
|  | 343 | >; | 
|  | 344 |  | 
| Matt Arsenault | a6867fd | 2017-01-23 22:31:03 +0000 | [diff] [blame] | 345 | // Denormal handling for fp64 and fp16 is controlled by the same | 
|  | 346 | // config register when fp16 supported. | 
|  | 347 | // TODO: Do we need a separate f16 setting when not legal? | 
|  | 348 | def FeatureFP64FP16Denormals : SubtargetFeature<"fp64-fp16-denormals", | 
|  | 349 | "FP64FP16Denormals", | 
| Matt Arsenault | 382d945 | 2016-01-26 04:49:22 +0000 | [diff] [blame] | 350 | "true", | 
| Matt Arsenault | a6867fd | 2017-01-23 22:31:03 +0000 | [diff] [blame] | 351 | "Enable double and half precision denormal handling", | 
| Matt Arsenault | 382d945 | 2016-01-26 04:49:22 +0000 | [diff] [blame] | 352 | [FeatureFP64] | 
|  | 353 | >; | 
|  | 354 |  | 
| Matt Arsenault | a6867fd | 2017-01-23 22:31:03 +0000 | [diff] [blame] | 355 | def FeatureFP64Denormals : SubtargetFeature<"fp64-denormals", | 
|  | 356 | "FP64FP16Denormals", | 
|  | 357 | "true", | 
|  | 358 | "Enable double and half precision denormal handling", | 
|  | 359 | [FeatureFP64, FeatureFP64FP16Denormals] | 
|  | 360 | >; | 
|  | 361 |  | 
|  | 362 | def FeatureFP16Denormals : SubtargetFeature<"fp16-denormals", | 
|  | 363 | "FP64FP16Denormals", | 
|  | 364 | "true", | 
|  | 365 | "Enable half precision denormal handling", | 
|  | 366 | [FeatureFP64FP16Denormals] | 
|  | 367 | >; | 
|  | 368 |  | 
| Matt Arsenault | 2fdf2a1 | 2017-02-21 23:35:48 +0000 | [diff] [blame] | 369 | def FeatureDX10Clamp : SubtargetFeature<"dx10-clamp", | 
|  | 370 | "DX10Clamp", | 
|  | 371 | "true", | 
|  | 372 | "clamp modifier clamps NaNs to 0.0" | 
|  | 373 | >; | 
|  | 374 |  | 
| Matt Arsenault | f639c32 | 2016-01-28 20:53:42 +0000 | [diff] [blame] | 375 | def FeatureFPExceptions : SubtargetFeature<"fp-exceptions", | 
|  | 376 | "FPExceptions", | 
|  | 377 | "true", | 
|  | 378 | "Enable floating point exceptions" | 
|  | 379 | >; | 
|  | 380 |  | 
| Matt Arsenault | 24ee078 | 2016-02-12 02:40:47 +0000 | [diff] [blame] | 381 | class FeatureMaxPrivateElementSize<int size> : SubtargetFeature< | 
|  | 382 | "max-private-element-size-"#size, | 
|  | 383 | "MaxPrivateElementSize", | 
|  | 384 | !cast<string>(size), | 
|  | 385 | "Maximum private access size may be "#size | 
|  | 386 | >; | 
|  | 387 |  | 
|  | 388 | def FeatureMaxPrivateElementSize4 : FeatureMaxPrivateElementSize<4>; | 
|  | 389 | def FeatureMaxPrivateElementSize8 : FeatureMaxPrivateElementSize<8>; | 
|  | 390 | def FeatureMaxPrivateElementSize16 : FeatureMaxPrivateElementSize<16>; | 
|  | 391 |  | 
| Matt Arsenault | 45b9818 | 2017-11-15 00:45:43 +0000 | [diff] [blame] | 392 | def FeatureEnableHugePrivateBuffer : SubtargetFeature< | 
|  | 393 | "huge-private-buffer", | 
|  | 394 | "EnableHugePrivateBuffer", | 
|  | 395 | "true", | 
|  | 396 | "Enable private/scratch buffer sizes greater than 128 GB" | 
|  | 397 | >; | 
|  | 398 |  | 
| Matt Arsenault | 382d945 | 2016-01-26 04:49:22 +0000 | [diff] [blame] | 399 | def FeatureVGPRSpilling : SubtargetFeature<"vgpr-spilling", | 
|  | 400 | "EnableVGPRSpilling", | 
|  | 401 | "true", | 
|  | 402 | "Enable spilling of VGPRs to scratch memory" | 
|  | 403 | >; | 
|  | 404 |  | 
|  | 405 | def FeatureDumpCode : SubtargetFeature <"DumpCode", | 
|  | 406 | "DumpCode", | 
|  | 407 | "true", | 
|  | 408 | "Dump MachineInstrs in the CodeEmitter" | 
|  | 409 | >; | 
|  | 410 |  | 
|  | 411 | def FeatureDumpCodeLower : SubtargetFeature <"dumpcode", | 
|  | 412 | "DumpCode", | 
|  | 413 | "true", | 
|  | 414 | "Dump MachineInstrs in the CodeEmitter" | 
|  | 415 | >; | 
|  | 416 |  | 
| Matt Arsenault | 382d945 | 2016-01-26 04:49:22 +0000 | [diff] [blame] | 417 | def FeaturePromoteAlloca : SubtargetFeature <"promote-alloca", | 
|  | 418 | "EnablePromoteAlloca", | 
|  | 419 | "true", | 
|  | 420 | "Enable promote alloca pass" | 
|  | 421 | >; | 
|  | 422 |  | 
|  | 423 | // XXX - This should probably be removed once enabled by default | 
|  | 424 | def FeatureEnableLoadStoreOpt : SubtargetFeature <"load-store-opt", | 
|  | 425 | "EnableLoadStoreOpt", | 
|  | 426 | "true", | 
|  | 427 | "Enable SI load/store optimizer pass" | 
|  | 428 | >; | 
|  | 429 |  | 
|  | 430 | // Performance debugging feature. Allow using DS instruction immediate | 
|  | 431 | // offsets even if the base pointer can't be proven to be base. On SI, | 
|  | 432 | // base pointer values that won't give the same result as a 16-bit add | 
|  | 433 | // are not safe to fold, but this will override the conservative test | 
|  | 434 | // for the base pointer. | 
|  | 435 | def FeatureEnableUnsafeDSOffsetFolding : SubtargetFeature < | 
|  | 436 | "unsafe-ds-offset-folding", | 
|  | 437 | "EnableUnsafeDSOffsetFolding", | 
|  | 438 | "true", | 
|  | 439 | "Force using DS instruction immediate offsets on SI" | 
|  | 440 | >; | 
|  | 441 |  | 
| Matt Arsenault | 382d945 | 2016-01-26 04:49:22 +0000 | [diff] [blame] | 442 | def FeatureEnableSIScheduler : SubtargetFeature<"si-scheduler", | 
|  | 443 | "EnableSIScheduler", | 
|  | 444 | "true", | 
|  | 445 | "Enable SI Machine Scheduler" | 
|  | 446 | >; | 
|  | 447 |  | 
| Marek Olsak | a9a58fa | 2018-04-10 22:48:23 +0000 | [diff] [blame] | 448 | def FeatureEnableDS128 : SubtargetFeature<"enable-ds128", | 
|  | 449 | "EnableDS128", | 
|  | 450 | "true", | 
|  | 451 | "Use ds_{read|write}_b128" | 
|  | 452 | >; | 
|  | 453 |  | 
| Matt Arsenault | 7aad8fd | 2017-01-24 22:02:15 +0000 | [diff] [blame] | 454 | // Unless +-flat-for-global is specified, turn on FlatForGlobal for | 
|  | 455 | // all OS-es on VI and newer hardware to avoid assertion failures due | 
|  | 456 | // to missing ADDR64 variants of MUBUF instructions. | 
|  | 457 | // FIXME: moveToVALU should be able to handle converting addr64 MUBUF | 
|  | 458 | // instructions. | 
|  | 459 |  | 
| Matt Arsenault | 382d945 | 2016-01-26 04:49:22 +0000 | [diff] [blame] | 460 | def FeatureFlatForGlobal : SubtargetFeature<"flat-for-global", | 
|  | 461 | "FlatForGlobal", | 
|  | 462 | "true", | 
| Matt Arsenault | d8f7ea3 | 2017-01-27 17:42:26 +0000 | [diff] [blame] | 463 | "Force to generate flat instruction for global" | 
| Matt Arsenault | 382d945 | 2016-01-26 04:49:22 +0000 | [diff] [blame] | 464 | >; | 
| Tom Stellard | d1f0f02 | 2015-04-23 19:33:54 +0000 | [diff] [blame] | 465 |  | 
| Konstantin Zhuravlyov | be6c0ca | 2017-06-02 17:40:26 +0000 | [diff] [blame] | 466 | def FeatureAutoWaitcntBeforeBarrier : SubtargetFeature < | 
|  | 467 | "auto-waitcnt-before-barrier", | 
|  | 468 | "AutoWaitcntBeforeBarrier", | 
|  | 469 | "true", | 
|  | 470 | "Hardware automatically inserts waitcnt before barrier" | 
|  | 471 | >; | 
|  | 472 |  | 
| Konstantin Zhuravlyov | eda425e | 2017-10-14 15:59:07 +0000 | [diff] [blame] | 473 | def FeatureCodeObjectV3 : SubtargetFeature < | 
|  | 474 | "code-object-v3", | 
|  | 475 | "CodeObjectV3", | 
|  | 476 | "true", | 
|  | 477 | "Generate code object version 3" | 
|  | 478 | >; | 
|  | 479 |  | 
| Tom Stellard | d1f0f02 | 2015-04-23 19:33:54 +0000 | [diff] [blame] | 480 | // Dummy feature used to disable assembler instructions. | 
|  | 481 | def FeatureDisable : SubtargetFeature<"", | 
| Matt Arsenault | 382d945 | 2016-01-26 04:49:22 +0000 | [diff] [blame] | 482 | "FeatureDisable","true", | 
|  | 483 | "Dummy feature to disable assembler instructions" | 
|  | 484 | >; | 
| Tom Stellard | d1f0f02 | 2015-04-23 19:33:54 +0000 | [diff] [blame] | 485 |  | 
| Tom Stellard | a6c6e1b | 2013-06-07 20:37:48 +0000 | [diff] [blame] | 486 | class SubtargetFeatureGeneration <string Value, | 
|  | 487 | list<SubtargetFeature> Implies> : | 
|  | 488 | SubtargetFeature <Value, "Gen", "AMDGPUSubtarget::"#Value, | 
|  | 489 | Value#" GPU generation", Implies>; | 
|  | 490 |  | 
| Tom Stellard | 880a80a | 2014-06-17 16:53:14 +0000 | [diff] [blame] | 491 | def FeatureLocalMemorySize0 : SubtargetFeatureLocalMemorySize<0>; | 
|  | 492 | def FeatureLocalMemorySize32768 : SubtargetFeatureLocalMemorySize<32768>; | 
|  | 493 | def FeatureLocalMemorySize65536 : SubtargetFeatureLocalMemorySize<65536>; | 
|  | 494 |  | 
| Tom Stellard | a6c6e1b | 2013-06-07 20:37:48 +0000 | [diff] [blame] | 495 | def FeatureR600 : SubtargetFeatureGeneration<"R600", | 
| Matt Arsenault | 382d945 | 2016-01-26 04:49:22 +0000 | [diff] [blame] | 496 | [FeatureR600ALUInst, FeatureFetchLimit8, FeatureLocalMemorySize0] | 
|  | 497 | >; | 
| Tom Stellard | a6c6e1b | 2013-06-07 20:37:48 +0000 | [diff] [blame] | 498 |  | 
|  | 499 | def FeatureR700 : SubtargetFeatureGeneration<"R700", | 
| Matt Arsenault | 382d945 | 2016-01-26 04:49:22 +0000 | [diff] [blame] | 500 | [FeatureFetchLimit16, FeatureLocalMemorySize0] | 
|  | 501 | >; | 
| Tom Stellard | a6c6e1b | 2013-06-07 20:37:48 +0000 | [diff] [blame] | 502 |  | 
|  | 503 | def FeatureEvergreen : SubtargetFeatureGeneration<"EVERGREEN", | 
| Matt Arsenault | 382d945 | 2016-01-26 04:49:22 +0000 | [diff] [blame] | 504 | [FeatureFetchLimit16, FeatureLocalMemorySize32768] | 
|  | 505 | >; | 
| Tom Stellard | a6c6e1b | 2013-06-07 20:37:48 +0000 | [diff] [blame] | 506 |  | 
|  | 507 | def FeatureNorthernIslands : SubtargetFeatureGeneration<"NORTHERN_ISLANDS", | 
| Matt Arsenault | 382d945 | 2016-01-26 04:49:22 +0000 | [diff] [blame] | 508 | [FeatureFetchLimit16, FeatureWavefrontSize64, | 
|  | 509 | FeatureLocalMemorySize32768] | 
| Tom Stellard | 880a80a | 2014-06-17 16:53:14 +0000 | [diff] [blame] | 510 | >; | 
| Tom Stellard | a6c6e1b | 2013-06-07 20:37:48 +0000 | [diff] [blame] | 511 |  | 
|  | 512 | def FeatureSouthernIslands : SubtargetFeatureGeneration<"SOUTHERN_ISLANDS", | 
| Dmitry Preobrazhensky | e3271ae | 2018-02-05 12:45:43 +0000 | [diff] [blame] | 513 | [FeatureFP64, FeatureLocalMemorySize32768, FeatureMIMG_R128, | 
| Matt Arsenault | 8728c5f | 2017-08-07 14:58:04 +0000 | [diff] [blame] | 514 | FeatureWavefrontSize64, FeatureGCN, | 
| Matt Arsenault | cc88ce3 | 2016-10-12 18:00:51 +0000 | [diff] [blame] | 515 | FeatureLDSBankCount32, FeatureMovrel] | 
| Matt Arsenault | 382d945 | 2016-01-26 04:49:22 +0000 | [diff] [blame] | 516 | >; | 
| Tom Stellard | a6c6e1b | 2013-06-07 20:37:48 +0000 | [diff] [blame] | 517 |  | 
| Tom Stellard | 6e1ee47 | 2013-10-29 16:37:28 +0000 | [diff] [blame] | 518 | def FeatureSeaIslands : SubtargetFeatureGeneration<"SEA_ISLANDS", | 
| Dmitry Preobrazhensky | e3271ae | 2018-02-05 12:45:43 +0000 | [diff] [blame] | 519 | [FeatureFP64, FeatureLocalMemorySize65536, FeatureMIMG_R128, | 
| Matt Arsenault | 382d945 | 2016-01-26 04:49:22 +0000 | [diff] [blame] | 520 | FeatureWavefrontSize64, FeatureGCN, FeatureFlatAddressSpace, | 
| Matt Arsenault | 8728c5f | 2017-08-07 14:58:04 +0000 | [diff] [blame] | 521 | FeatureCIInsts, FeatureMovrel] | 
| Matt Arsenault | 382d945 | 2016-01-26 04:49:22 +0000 | [diff] [blame] | 522 | >; | 
| Marek Olsak | 5df00d6 | 2014-12-07 12:18:57 +0000 | [diff] [blame] | 523 |  | 
|  | 524 | def FeatureVolcanicIslands : SubtargetFeatureGeneration<"VOLCANIC_ISLANDS", | 
| Dmitry Preobrazhensky | e3271ae | 2018-02-05 12:45:43 +0000 | [diff] [blame] | 525 | [FeatureFP64, FeatureLocalMemorySize65536, FeatureMIMG_R128, | 
| Matt Arsenault | 382d945 | 2016-01-26 04:49:22 +0000 | [diff] [blame] | 526 | FeatureWavefrontSize64, FeatureFlatAddressSpace, FeatureGCN, | 
| Matt Arsenault | 9d82ee7 | 2016-02-27 08:53:55 +0000 | [diff] [blame] | 527 | FeatureGCN3Encoding, FeatureCIInsts, Feature16BitInsts, | 
| Matt Arsenault | 7b64755 | 2016-10-28 21:55:15 +0000 | [diff] [blame] | 528 | FeatureSMemRealTime, FeatureVGPRIndexMode, FeatureMovrel, | 
| Sam Kolton | 3c4933f | 2017-06-22 06:26:41 +0000 | [diff] [blame] | 529 | FeatureScalarStores, FeatureInv2PiInlineImm, | 
| Dmitry Preobrazhensky | ff64aa5 | 2017-08-16 13:51:56 +0000 | [diff] [blame] | 530 | FeatureSDWA, FeatureSDWAOutModsVOPC, FeatureSDWAMac, FeatureDPP, | 
|  | 531 | FeatureIntClamp | 
| Matt Arsenault | 9d82ee7 | 2016-02-27 08:53:55 +0000 | [diff] [blame] | 532 | ] | 
| Matt Arsenault | 382d945 | 2016-01-26 04:49:22 +0000 | [diff] [blame] | 533 | >; | 
| Marek Olsak | 5df00d6 | 2014-12-07 12:18:57 +0000 | [diff] [blame] | 534 |  | 
| Matt Arsenault | e823d92 | 2017-02-18 18:29:53 +0000 | [diff] [blame] | 535 | def FeatureGFX9 : SubtargetFeatureGeneration<"GFX9", | 
|  | 536 | [FeatureFP64, FeatureLocalMemorySize65536, | 
|  | 537 | FeatureWavefrontSize64, FeatureFlatAddressSpace, FeatureGCN, | 
|  | 538 | FeatureGCN3Encoding, FeatureCIInsts, Feature16BitInsts, | 
|  | 539 | FeatureSMemRealTime, FeatureScalarStores, FeatureInv2PiInlineImm, | 
| Konstantin Zhuravlyov | f628406 | 2017-04-21 19:57:53 +0000 | [diff] [blame] | 540 | FeatureApertureRegs, FeatureGFX9Insts, FeatureVOP3P, FeatureVGPRIndexMode, | 
| Dmitry Preobrazhensky | ff64aa5 | 2017-08-16 13:51:56 +0000 | [diff] [blame] | 541 | FeatureFastFMAF32, FeatureDPP, FeatureIntClamp, | 
| Sam Kolton | 3c4933f | 2017-06-22 06:26:41 +0000 | [diff] [blame] | 542 | FeatureSDWA, FeatureSDWAOmod, FeatureSDWAScalar, FeatureSDWASdst, | 
| Matt Arsenault | c37fe66 | 2017-07-20 17:42:47 +0000 | [diff] [blame] | 543 | FeatureFlatInstOffsets, FeatureFlatGlobalInsts, FeatureFlatScratchInsts, | 
| Dmitry Preobrazhensky | 6bad04e | 2018-04-02 16:10:25 +0000 | [diff] [blame] | 544 | FeatureAddNoCarryInsts, FeatureScalarAtomics | 
| Matt Arsenault | e823d92 | 2017-02-18 18:29:53 +0000 | [diff] [blame] | 545 | ] | 
|  | 546 | >; | 
|  | 547 |  | 
| Yaxun Liu | 94add85 | 2016-10-26 16:37:56 +0000 | [diff] [blame] | 548 | class SubtargetFeatureISAVersion <int Major, int Minor, int Stepping, | 
|  | 549 | list<SubtargetFeature> Implies> | 
|  | 550 | : SubtargetFeature < | 
|  | 551 | "isaver"#Major#"."#Minor#"."#Stepping, | 
|  | 552 | "IsaVersion", | 
|  | 553 | "ISAVersion"#Major#"_"#Minor#"_"#Stepping, | 
|  | 554 | "Instruction set version number", | 
|  | 555 | Implies | 
|  | 556 | >; | 
|  | 557 |  | 
| Wei Ding | 7c3e511 | 2017-06-10 03:53:19 +0000 | [diff] [blame] | 558 | def FeatureISAVersion6_0_0 : SubtargetFeatureISAVersion <6,0,0, | 
|  | 559 | [FeatureSouthernIslands, | 
| Matt Arsenault | 8bcf2f2 | 2017-06-26 03:01:36 +0000 | [diff] [blame] | 560 | FeatureFastFMAF32, | 
| Wei Ding | 7c3e511 | 2017-06-10 03:53:19 +0000 | [diff] [blame] | 561 | HalfRate64Ops, | 
|  | 562 | FeatureLDSBankCount32]>; | 
|  | 563 |  | 
|  | 564 | def FeatureISAVersion6_0_1 : SubtargetFeatureISAVersion <6,0,1, | 
|  | 565 | [FeatureSouthernIslands, | 
|  | 566 | FeatureLDSBankCount32]>; | 
| Matt Arsenault | 8bcf2f2 | 2017-06-26 03:01:36 +0000 | [diff] [blame] | 567 |  | 
| Matt Arsenault | f3dd863 | 2016-11-01 00:55:14 +0000 | [diff] [blame] | 568 | def FeatureISAVersion7_0_0 : SubtargetFeatureISAVersion <7,0,0, | 
| Yaxun Liu | 94add85 | 2016-10-26 16:37:56 +0000 | [diff] [blame] | 569 | [FeatureSeaIslands, | 
|  | 570 | FeatureLDSBankCount32]>; | 
| Matt Arsenault | f3dd863 | 2016-11-01 00:55:14 +0000 | [diff] [blame] | 571 |  | 
| Yaxun Liu | 94add85 | 2016-10-26 16:37:56 +0000 | [diff] [blame] | 572 | def FeatureISAVersion7_0_1 : SubtargetFeatureISAVersion <7,0,1, | 
|  | 573 | [FeatureSeaIslands, | 
|  | 574 | HalfRate64Ops, | 
|  | 575 | FeatureLDSBankCount32, | 
|  | 576 | FeatureFastFMAF32]>; | 
| Matt Arsenault | f3dd863 | 2016-11-01 00:55:14 +0000 | [diff] [blame] | 577 |  | 
| Yaxun Liu | 94add85 | 2016-10-26 16:37:56 +0000 | [diff] [blame] | 578 | def FeatureISAVersion7_0_2 : SubtargetFeatureISAVersion <7,0,2, | 
|  | 579 | [FeatureSeaIslands, | 
| Konstantin Zhuravlyov | 40b09e8 | 2018-02-27 21:46:15 +0000 | [diff] [blame] | 580 | FeatureLDSBankCount16, | 
|  | 581 | FeatureFastFMAF32]>; | 
| Matt Arsenault | f3dd863 | 2016-11-01 00:55:14 +0000 | [diff] [blame] | 582 |  | 
| Wei Ding | 7c3e511 | 2017-06-10 03:53:19 +0000 | [diff] [blame] | 583 | def FeatureISAVersion7_0_3 : SubtargetFeatureISAVersion <7,0,3, | 
|  | 584 | [FeatureSeaIslands, | 
|  | 585 | FeatureLDSBankCount16]>; | 
|  | 586 |  | 
| Konstantin Zhuravlyov | c40d9f2 | 2017-12-08 20:52:28 +0000 | [diff] [blame] | 587 | def FeatureISAVersion7_0_4 : SubtargetFeatureISAVersion <7,0,4, | 
|  | 588 | [FeatureSeaIslands, | 
|  | 589 | FeatureLDSBankCount32]>; | 
|  | 590 |  | 
| Yaxun Liu | 94add85 | 2016-10-26 16:37:56 +0000 | [diff] [blame] | 591 | def FeatureISAVersion8_0_1 : SubtargetFeatureISAVersion <8,0,1, | 
|  | 592 | [FeatureVolcanicIslands, | 
| Konstantin Zhuravlyov | 6810765 | 2017-08-24 20:03:07 +0000 | [diff] [blame] | 593 | FeatureFastFMAF32, | 
|  | 594 | HalfRate64Ops, | 
| Yaxun Liu | 94add85 | 2016-10-26 16:37:56 +0000 | [diff] [blame] | 595 | FeatureLDSBankCount32, | 
| Changpeng Fang | 44dfa1d | 2018-01-12 21:12:19 +0000 | [diff] [blame] | 596 | FeatureXNACK, | 
|  | 597 | FeatureUnpackedD16VMem]>; | 
| Matt Arsenault | f3dd863 | 2016-11-01 00:55:14 +0000 | [diff] [blame] | 598 |  | 
| Yaxun Liu | 94add85 | 2016-10-26 16:37:56 +0000 | [diff] [blame] | 599 | def FeatureISAVersion8_0_2 : SubtargetFeatureISAVersion <8,0,2, | 
|  | 600 | [FeatureVolcanicIslands, | 
|  | 601 | FeatureLDSBankCount32, | 
| Changpeng Fang | 44dfa1d | 2018-01-12 21:12:19 +0000 | [diff] [blame] | 602 | FeatureSGPRInitBug, | 
|  | 603 | FeatureUnpackedD16VMem]>; | 
| Matt Arsenault | f3dd863 | 2016-11-01 00:55:14 +0000 | [diff] [blame] | 604 |  | 
| Yaxun Liu | 94add85 | 2016-10-26 16:37:56 +0000 | [diff] [blame] | 605 | def FeatureISAVersion8_0_3 : SubtargetFeatureISAVersion <8,0,3, | 
|  | 606 | [FeatureVolcanicIslands, | 
| Changpeng Fang | 44dfa1d | 2018-01-12 21:12:19 +0000 | [diff] [blame] | 607 | FeatureLDSBankCount32, | 
|  | 608 | FeatureUnpackedD16VMem]>; | 
| Matt Arsenault | f3dd863 | 2016-11-01 00:55:14 +0000 | [diff] [blame] | 609 |  | 
| Yaxun Liu | 94add85 | 2016-10-26 16:37:56 +0000 | [diff] [blame] | 610 | def FeatureISAVersion8_1_0 : SubtargetFeatureISAVersion <8,1,0, | 
|  | 611 | [FeatureVolcanicIslands, | 
|  | 612 | FeatureLDSBankCount16, | 
|  | 613 | FeatureXNACK]>; | 
|  | 614 |  | 
| Wei Ding | 7c3e511 | 2017-06-10 03:53:19 +0000 | [diff] [blame] | 615 | def FeatureISAVersion9_0_0 : SubtargetFeatureISAVersion <9,0,0, | 
|  | 616 | [FeatureGFX9, | 
| Matt Arsenault | 28f52e5 | 2017-10-25 07:00:51 +0000 | [diff] [blame] | 617 | FeatureMadMixInsts, | 
| Konstantin Zhuravlyov | c2c2eb7 | 2018-05-04 20:06:57 +0000 | [diff] [blame] | 618 | FeatureLDSBankCount32, | 
|  | 619 | FeatureD16PreservesUnusedBits | 
| Matt Arsenault | 28f52e5 | 2017-10-25 07:00:51 +0000 | [diff] [blame] | 620 | ]>; | 
| Wei Ding | 7c3e511 | 2017-06-10 03:53:19 +0000 | [diff] [blame] | 621 |  | 
| Wei Ding | 7c3e511 | 2017-06-10 03:53:19 +0000 | [diff] [blame] | 622 | def FeatureISAVersion9_0_2 : SubtargetFeatureISAVersion <9,0,2, | 
|  | 623 | [FeatureGFX9, | 
| Matt Arsenault | 28f52e5 | 2017-10-25 07:00:51 +0000 | [diff] [blame] | 624 | FeatureMadMixInsts, | 
| Konstantin Zhuravlyov | 331f97e17 | 2018-02-16 21:26:25 +0000 | [diff] [blame] | 625 | FeatureLDSBankCount32, | 
| Konstantin Zhuravlyov | c2c2eb7 | 2018-05-04 20:06:57 +0000 | [diff] [blame] | 626 | FeatureXNACK, | 
|  | 627 | FeatureD16PreservesUnusedBits | 
| Matt Arsenault | 28f52e5 | 2017-10-25 07:00:51 +0000 | [diff] [blame] | 628 | ]>; | 
| Wei Ding | 7c3e511 | 2017-06-10 03:53:19 +0000 | [diff] [blame] | 629 |  | 
| Matt Arsenault | 0084adc | 2018-04-30 19:08:16 +0000 | [diff] [blame] | 630 | def FeatureISAVersion9_0_4 : SubtargetFeatureISAVersion <9,0,4, | 
|  | 631 | [FeatureGFX9, | 
|  | 632 | FeatureLDSBankCount32, | 
| Konstantin Zhuravlyov | c2c2eb7 | 2018-05-04 20:06:57 +0000 | [diff] [blame] | 633 | FeatureFmaMixInsts, | 
|  | 634 | FeatureD16PreservesUnusedBits]>; | 
| Matt Arsenault | 0084adc | 2018-04-30 19:08:16 +0000 | [diff] [blame] | 635 |  | 
|  | 636 | def FeatureISAVersion9_0_6 : SubtargetFeatureISAVersion <9,0,6, | 
|  | 637 | [FeatureGFX9, | 
|  | 638 | HalfRate64Ops, | 
|  | 639 | FeatureFmaMixInsts, | 
|  | 640 | FeatureLDSBankCount32, | 
|  | 641 | FeatureDLInsts]>; | 
|  | 642 |  | 
| Tom Stellard | 3498e4f | 2013-06-07 20:28:55 +0000 | [diff] [blame] | 643 | //===----------------------------------------------------------------------===// | 
| Konstantin Zhuravlyov | 8c273ad | 2016-04-18 16:28:23 +0000 | [diff] [blame] | 644 | // Debugger related subtarget features. | 
|  | 645 | //===----------------------------------------------------------------------===// | 
|  | 646 |  | 
|  | 647 | def FeatureDebuggerInsertNops : SubtargetFeature< | 
|  | 648 | "amdgpu-debugger-insert-nops", | 
|  | 649 | "DebuggerInsertNops", | 
|  | 650 | "true", | 
| Konstantin Zhuravlyov | e3d322a | 2016-05-13 18:21:28 +0000 | [diff] [blame] | 651 | "Insert one nop instruction for each high level source statement" | 
| Konstantin Zhuravlyov | 8c273ad | 2016-04-18 16:28:23 +0000 | [diff] [blame] | 652 | >; | 
|  | 653 |  | 
| Konstantin Zhuravlyov | 29ddd2b | 2016-05-24 18:37:18 +0000 | [diff] [blame] | 654 | def FeatureDebuggerReserveRegs : SubtargetFeature< | 
|  | 655 | "amdgpu-debugger-reserve-regs", | 
|  | 656 | "DebuggerReserveRegs", | 
| Konstantin Zhuravlyov | 1d99c4d | 2016-04-26 15:43:14 +0000 | [diff] [blame] | 657 | "true", | 
| Konstantin Zhuravlyov | 29ddd2b | 2016-05-24 18:37:18 +0000 | [diff] [blame] | 658 | "Reserve registers for debugger usage" | 
| Konstantin Zhuravlyov | 1d99c4d | 2016-04-26 15:43:14 +0000 | [diff] [blame] | 659 | >; | 
|  | 660 |  | 
| Konstantin Zhuravlyov | f2f3d14 | 2016-06-25 03:11:28 +0000 | [diff] [blame] | 661 | def FeatureDebuggerEmitPrologue : SubtargetFeature< | 
|  | 662 | "amdgpu-debugger-emit-prologue", | 
|  | 663 | "DebuggerEmitPrologue", | 
|  | 664 | "true", | 
|  | 665 | "Emit debugger prologue" | 
|  | 666 | >; | 
|  | 667 |  | 
| Konstantin Zhuravlyov | 8c273ad | 2016-04-18 16:28:23 +0000 | [diff] [blame] | 668 | //===----------------------------------------------------------------------===// | 
| Tom Stellard | 75aadc2 | 2012-12-11 21:25:42 +0000 | [diff] [blame] | 669 |  | 
|  | 670 | def AMDGPUInstrInfo : InstrInfo { | 
|  | 671 | let guessInstructionProperties = 1; | 
| Matt Arsenault | 1ecac06 | 2015-02-18 02:15:32 +0000 | [diff] [blame] | 672 | let noNamedPositionallyEncodedOperands = 1; | 
| Tom Stellard | 75aadc2 | 2012-12-11 21:25:42 +0000 | [diff] [blame] | 673 | } | 
|  | 674 |  | 
| Tom Stellard | 9d7ddd5 | 2014-11-14 14:08:00 +0000 | [diff] [blame] | 675 | def AMDGPUAsmParser : AsmParser { | 
|  | 676 | // Some of the R600 registers have the same name, so this crashes. | 
|  | 677 | // For example T0_XYZW and T0_XY both have the asm name T0. | 
|  | 678 | let ShouldEmitMatchRegisterName = 0; | 
|  | 679 | } | 
|  | 680 |  | 
| Konstantin Zhuravlyov | da4687c | 2016-09-27 14:42:48 +0000 | [diff] [blame] | 681 | def AMDGPUAsmWriter : AsmWriter { | 
|  | 682 | int PassSubtarget = 1; | 
|  | 683 | } | 
|  | 684 |  | 
| Sam Kolton | d63d8a7 | 2016-09-09 09:37:51 +0000 | [diff] [blame] | 685 | def AMDGPUAsmVariants { | 
|  | 686 | string Default = "Default"; | 
|  | 687 | int Default_ID = 0; | 
|  | 688 | string VOP3 = "VOP3"; | 
|  | 689 | int VOP3_ID = 1; | 
|  | 690 | string SDWA = "SDWA"; | 
|  | 691 | int SDWA_ID = 2; | 
| Sam Kolton | f7659d71 | 2017-05-23 10:08:55 +0000 | [diff] [blame] | 692 | string SDWA9 = "SDWA9"; | 
|  | 693 | int SDWA9_ID = 3; | 
| Sam Kolton | d63d8a7 | 2016-09-09 09:37:51 +0000 | [diff] [blame] | 694 | string DPP = "DPP"; | 
| Sam Kolton | f7659d71 | 2017-05-23 10:08:55 +0000 | [diff] [blame] | 695 | int DPP_ID = 4; | 
| Sam Kolton | fb0d9d9 | 2016-09-12 14:42:43 +0000 | [diff] [blame] | 696 | string Disable = "Disable"; | 
| Sam Kolton | f7659d71 | 2017-05-23 10:08:55 +0000 | [diff] [blame] | 697 | int Disable_ID = 5; | 
| Sam Kolton | d63d8a7 | 2016-09-09 09:37:51 +0000 | [diff] [blame] | 698 | } | 
|  | 699 |  | 
|  | 700 | def DefaultAMDGPUAsmParserVariant : AsmParserVariant { | 
|  | 701 | let Variant = AMDGPUAsmVariants.Default_ID; | 
|  | 702 | let Name = AMDGPUAsmVariants.Default; | 
|  | 703 | } | 
|  | 704 |  | 
|  | 705 | def VOP3AsmParserVariant : AsmParserVariant { | 
|  | 706 | let Variant = AMDGPUAsmVariants.VOP3_ID; | 
|  | 707 | let Name = AMDGPUAsmVariants.VOP3; | 
|  | 708 | } | 
|  | 709 |  | 
|  | 710 | def SDWAAsmParserVariant : AsmParserVariant { | 
|  | 711 | let Variant = AMDGPUAsmVariants.SDWA_ID; | 
|  | 712 | let Name = AMDGPUAsmVariants.SDWA; | 
|  | 713 | } | 
|  | 714 |  | 
| Sam Kolton | f7659d71 | 2017-05-23 10:08:55 +0000 | [diff] [blame] | 715 | def SDWA9AsmParserVariant : AsmParserVariant { | 
|  | 716 | let Variant = AMDGPUAsmVariants.SDWA9_ID; | 
|  | 717 | let Name = AMDGPUAsmVariants.SDWA9; | 
|  | 718 | } | 
|  | 719 |  | 
|  | 720 |  | 
| Sam Kolton | d63d8a7 | 2016-09-09 09:37:51 +0000 | [diff] [blame] | 721 | def DPPAsmParserVariant : AsmParserVariant { | 
|  | 722 | let Variant = AMDGPUAsmVariants.DPP_ID; | 
|  | 723 | let Name = AMDGPUAsmVariants.DPP; | 
|  | 724 | } | 
|  | 725 |  | 
| Tom Stellard | 75aadc2 | 2012-12-11 21:25:42 +0000 | [diff] [blame] | 726 | def AMDGPU : Target { | 
|  | 727 | // Pull in Instruction Info: | 
|  | 728 | let InstructionSet = AMDGPUInstrInfo; | 
| Tom Stellard | 9d7ddd5 | 2014-11-14 14:08:00 +0000 | [diff] [blame] | 729 | let AssemblyParsers = [AMDGPUAsmParser]; | 
| Sam Kolton | d63d8a7 | 2016-09-09 09:37:51 +0000 | [diff] [blame] | 730 | let AssemblyParserVariants = [DefaultAMDGPUAsmParserVariant, | 
|  | 731 | VOP3AsmParserVariant, | 
|  | 732 | SDWAAsmParserVariant, | 
| Sam Kolton | f7659d71 | 2017-05-23 10:08:55 +0000 | [diff] [blame] | 733 | SDWA9AsmParserVariant, | 
| Sam Kolton | d63d8a7 | 2016-09-09 09:37:51 +0000 | [diff] [blame] | 734 | DPPAsmParserVariant]; | 
| Konstantin Zhuravlyov | da4687c | 2016-09-27 14:42:48 +0000 | [diff] [blame] | 735 | let AssemblyWriters = [AMDGPUAsmWriter]; | 
| Geoff Berry | f8bf2ec | 2018-02-23 18:25:08 +0000 | [diff] [blame] | 736 | let AllowRegisterRenaming = 1; | 
| Tom Stellard | 75aadc2 | 2012-12-11 21:25:42 +0000 | [diff] [blame] | 737 | } | 
|  | 738 |  | 
| Tom Stellard | bc5b537 | 2014-06-13 16:38:59 +0000 | [diff] [blame] | 739 | // Dummy Instruction itineraries for pseudo instructions | 
|  | 740 | def ALU_NULL : FuncUnit; | 
|  | 741 | def NullALU : InstrItinClass; | 
|  | 742 |  | 
| Tom Stellard | 0e70de5 | 2014-05-16 20:56:45 +0000 | [diff] [blame] | 743 | //===----------------------------------------------------------------------===// | 
|  | 744 | // Predicate helper class | 
|  | 745 | //===----------------------------------------------------------------------===// | 
|  | 746 |  | 
| Tom Stellard | d1f0f02 | 2015-04-23 19:33:54 +0000 | [diff] [blame] | 747 | def TruePredicate : Predicate<"true">; | 
| Matt Arsenault | 382d945 | 2016-01-26 04:49:22 +0000 | [diff] [blame] | 748 |  | 
| Tom Stellard | d1f0f02 | 2015-04-23 19:33:54 +0000 | [diff] [blame] | 749 | def isSICI : Predicate< | 
|  | 750 | "Subtarget->getGeneration() == AMDGPUSubtarget::SOUTHERN_ISLANDS ||" | 
|  | 751 | "Subtarget->getGeneration() == AMDGPUSubtarget::SEA_ISLANDS" | 
| Matt Arsenault | 8728c5f | 2017-08-07 14:58:04 +0000 | [diff] [blame] | 752 | >, AssemblerPredicate<"!FeatureGCN3Encoding">; | 
| Tom Stellard | d1f0f02 | 2015-04-23 19:33:54 +0000 | [diff] [blame] | 753 |  | 
| Tom Stellard | 5ebdfbe | 2015-12-24 03:18:18 +0000 | [diff] [blame] | 754 | def isVI : Predicate < | 
|  | 755 | "Subtarget->getGeneration() >= AMDGPUSubtarget::VOLCANIC_ISLANDS">, | 
|  | 756 | AssemblerPredicate<"FeatureGCN3Encoding">; | 
|  | 757 |  | 
| Matt Arsenault | 2021f08 | 2017-02-18 19:12:26 +0000 | [diff] [blame] | 758 | def isGFX9 : Predicate < | 
|  | 759 | "Subtarget->getGeneration() >= AMDGPUSubtarget::GFX9">, | 
|  | 760 | AssemblerPredicate<"FeatureGFX9Insts">; | 
|  | 761 |  | 
| Matt Arsenault | e823d92 | 2017-02-18 18:29:53 +0000 | [diff] [blame] | 762 | // TODO: Either the name to be changed or we simply use IsCI! | 
| Matt Arsenault | 382d945 | 2016-01-26 04:49:22 +0000 | [diff] [blame] | 763 | def isCIVI : Predicate < | 
| Matt Arsenault | e823d92 | 2017-02-18 18:29:53 +0000 | [diff] [blame] | 764 | "Subtarget->getGeneration() >= AMDGPUSubtarget::SEA_ISLANDS">, | 
|  | 765 | AssemblerPredicate<"FeatureCIInsts">; | 
| Matt Arsenault | 382d945 | 2016-01-26 04:49:22 +0000 | [diff] [blame] | 766 |  | 
| Matt Arsenault | 9698f1c | 2017-06-20 19:54:14 +0000 | [diff] [blame] | 767 | def HasFlatAddressSpace : Predicate<"Subtarget->hasFlatAddressSpace()">, | 
|  | 768 | AssemblerPredicate<"FeatureFlatAddressSpace">; | 
|  | 769 |  | 
|  | 770 | def HasFlatGlobalInsts : Predicate<"Subtarget->hasFlatGlobalInsts()">, | 
|  | 771 | AssemblerPredicate<"FeatureFlatGlobalInsts">; | 
| Matt Arsenault | ca7b0a1 | 2017-07-21 15:36:16 +0000 | [diff] [blame] | 772 | def HasFlatScratchInsts : Predicate<"Subtarget->hasFlatScratchInsts()">, | 
|  | 773 | AssemblerPredicate<"FeatureFlatScratchInsts">; | 
| Matt Arsenault | ed6e8f0 | 2017-09-01 18:36:06 +0000 | [diff] [blame] | 774 | def HasD16LoadStore : Predicate<"Subtarget->hasD16LoadStore()">, | 
|  | 775 | AssemblerPredicate<"FeatureGFX9Insts">; | 
| Matt Arsenault | 382d945 | 2016-01-26 04:49:22 +0000 | [diff] [blame] | 776 |  | 
| Changpeng Fang | 44dfa1d | 2018-01-12 21:12:19 +0000 | [diff] [blame] | 777 | def HasUnpackedD16VMem : Predicate<"Subtarget->hasUnpackedD16VMem()">, | 
|  | 778 | AssemblerPredicate<"FeatureUnpackedD16VMem">; | 
|  | 779 | def HasPackedD16VMem : Predicate<"!Subtarget->hasUnpackedD16VMem()">, | 
|  | 780 | AssemblerPredicate<"!FeatureUnpackedD16VMem">; | 
|  | 781 |  | 
| Konstantin Zhuravlyov | c2c2eb7 | 2018-05-04 20:06:57 +0000 | [diff] [blame] | 782 | def D16PreservesUnusedBits : Predicate<"Subtarget->d16PreservesUnusedBits()">, | 
|  | 783 | AssemblerPredicate<"FeatureD16PreservesUnusedBits">; | 
| Matt Arsenault | 3f71c0e | 2017-11-29 00:55:57 +0000 | [diff] [blame] | 784 |  | 
|  | 785 | def LDSRequiresM0Init : Predicate<"Subtarget->ldsRequiresM0Init()">; | 
|  | 786 | def NotLDSRequiresM0Init : Predicate<"!Subtarget->ldsRequiresM0Init()">; | 
|  | 787 |  | 
| Matt Arsenault | efa1d65 | 2017-09-01 18:38:02 +0000 | [diff] [blame] | 788 | def HasDSAddTid : Predicate<"Subtarget->getGeneration() >= AMDGPUSubtarget::GFX9">, | 
|  | 789 | AssemblerPredicate<"FeatureGFX9Insts">; | 
|  | 790 |  | 
| Matt Arsenault | c37fe66 | 2017-07-20 17:42:47 +0000 | [diff] [blame] | 791 | def HasAddNoCarryInsts : Predicate<"Subtarget->hasAddNoCarryInsts()">, | 
|  | 792 | AssemblerPredicate<"FeatureAddNoCarryInsts">; | 
|  | 793 |  | 
|  | 794 | def NotHasAddNoCarryInsts : Predicate<"!Subtarget->hasAddNoCarryInsts()">, | 
|  | 795 | AssemblerPredicate<"!FeatureAddNoCarryInsts">; | 
|  | 796 |  | 
| Matt Arsenault | 9be7b0d | 2017-02-27 18:49:11 +0000 | [diff] [blame] | 797 | def Has16BitInsts : Predicate<"Subtarget->has16BitInsts()">, | 
|  | 798 | AssemblerPredicate<"Feature16BitInsts">; | 
|  | 799 | def HasVOP3PInsts : Predicate<"Subtarget->hasVOP3PInsts()">, | 
|  | 800 | AssemblerPredicate<"FeatureVOP3P">; | 
| Tom Stellard | 115a615 | 2016-11-10 16:02:37 +0000 | [diff] [blame] | 801 |  | 
| Sam Kolton | 07dbde2 | 2017-01-20 10:01:25 +0000 | [diff] [blame] | 802 | def HasSDWA : Predicate<"Subtarget->hasSDWA()">, | 
| Sam Kolton | f7659d71 | 2017-05-23 10:08:55 +0000 | [diff] [blame] | 803 | AssemblerPredicate<"FeatureSDWA,FeatureVolcanicIslands">; | 
|  | 804 |  | 
|  | 805 | def HasSDWA9 : Predicate<"Subtarget->hasSDWA()">, | 
|  | 806 | AssemblerPredicate<"FeatureSDWA,FeatureGFX9">; | 
| Sam Kolton | 07dbde2 | 2017-01-20 10:01:25 +0000 | [diff] [blame] | 807 |  | 
|  | 808 | def HasDPP : Predicate<"Subtarget->hasDPP()">, | 
|  | 809 | AssemblerPredicate<"FeatureDPP">; | 
|  | 810 |  | 
| Dmitry Preobrazhensky | ff64aa5 | 2017-08-16 13:51:56 +0000 | [diff] [blame] | 811 | def HasIntClamp : Predicate<"Subtarget->hasIntClamp()">, | 
|  | 812 | AssemblerPredicate<"FeatureIntClamp">; | 
|  | 813 |  | 
| Matt Arsenault | 28f52e5 | 2017-10-25 07:00:51 +0000 | [diff] [blame] | 814 | def HasMadMixInsts : Predicate<"Subtarget->hasMadMixInsts()">, | 
|  | 815 | AssemblerPredicate<"FeatureMadMixInsts">; | 
| Matt Arsenault | d7e2303 | 2017-09-07 18:05:07 +0000 | [diff] [blame] | 816 |  | 
| Dmitry Preobrazhensky | 6bad04e | 2018-04-02 16:10:25 +0000 | [diff] [blame] | 817 | def HasScalarAtomics : Predicate<"Subtarget->hasScalarAtomics()">, | 
|  | 818 | AssemblerPredicate<"FeatureScalarAtomics">; | 
|  | 819 |  | 
| Matt Arsenault | 8474803 | 2018-04-26 19:21:26 +0000 | [diff] [blame] | 820 | def has16BankLDS : Predicate<"Subtarget->getLDSBankCount() == 16">; | 
|  | 821 | def has32BankLDS : Predicate<"Subtarget->getLDSBankCount() == 32">; | 
|  | 822 | def HasVGPRIndexMode : Predicate<"Subtarget->hasVGPRIndexMode()">, | 
|  | 823 | AssemblerPredicate<"FeatureVGPRIndexMode">; | 
|  | 824 | def HasMovrel : Predicate<"Subtarget->hasMovrel()">, | 
|  | 825 | AssemblerPredicate<"FeatureMovrel">; | 
|  | 826 |  | 
| Matt Arsenault | 0084adc | 2018-04-30 19:08:16 +0000 | [diff] [blame] | 827 | def HasFmaMixInsts : Predicate<"Subtarget->hasFmaMixInsts()">, | 
|  | 828 | AssemblerPredicate<"FeatureFmaMixInsts">; | 
|  | 829 |  | 
|  | 830 | def HasDLInsts : Predicate<"Subtarget->hasDLInsts()">, | 
|  | 831 | AssemblerPredicate<"FeatureDLInsts">; | 
|  | 832 |  | 
|  | 833 |  | 
| Matt Arsenault | cc85223 | 2017-10-10 20:22:07 +0000 | [diff] [blame] | 834 | def EnableLateCFGStructurize : Predicate< | 
|  | 835 | "EnableLateStructurizeCFG">; | 
| Matt Arsenault | 90c7593 | 2017-10-03 00:06:41 +0000 | [diff] [blame] | 836 |  | 
|  | 837 | // Exists to help track down where SubtargetPredicate isn't set rather | 
|  | 838 | // than letting tablegen crash with an unhelpful error. | 
|  | 839 | def InvalidPred : Predicate<"predicate not set on instruction or pattern">; | 
|  | 840 |  | 
| Tom Stellard | 0e70de5 | 2014-05-16 20:56:45 +0000 | [diff] [blame] | 841 | class PredicateControl { | 
| Matt Arsenault | 90c7593 | 2017-10-03 00:06:41 +0000 | [diff] [blame] | 842 | Predicate SubtargetPredicate = InvalidPred; | 
| Tom Stellard | d1f0f02 | 2015-04-23 19:33:54 +0000 | [diff] [blame] | 843 | Predicate SIAssemblerPredicate = isSICI; | 
| Tom Stellard | 5ebdfbe | 2015-12-24 03:18:18 +0000 | [diff] [blame] | 844 | Predicate VIAssemblerPredicate = isVI; | 
| Tom Stellard | d7e6f13 | 2015-04-08 01:09:26 +0000 | [diff] [blame] | 845 | list<Predicate> AssemblerPredicates = []; | 
| Tom Stellard | d1f0f02 | 2015-04-23 19:33:54 +0000 | [diff] [blame] | 846 | Predicate AssemblerPredicate = TruePredicate; | 
| Tom Stellard | 0e70de5 | 2014-05-16 20:56:45 +0000 | [diff] [blame] | 847 | list<Predicate> OtherPredicates = []; | 
| Matt Arsenault | 90c7593 | 2017-10-03 00:06:41 +0000 | [diff] [blame] | 848 | list<Predicate> Predicates = !listconcat([SubtargetPredicate, | 
|  | 849 | AssemblerPredicate], | 
| Tom Stellard | d7e6f13 | 2015-04-08 01:09:26 +0000 | [diff] [blame] | 850 | AssemblerPredicates, | 
| Tom Stellard | 0e70de5 | 2014-05-16 20:56:45 +0000 | [diff] [blame] | 851 | OtherPredicates); | 
|  | 852 | } | 
|  | 853 |  | 
| Matt Arsenault | 90c7593 | 2017-10-03 00:06:41 +0000 | [diff] [blame] | 854 | class AMDGPUPat<dag pattern, dag result> : Pat<pattern, result>, | 
|  | 855 | PredicateControl; | 
|  | 856 |  | 
|  | 857 |  | 
| Tom Stellard | 75aadc2 | 2012-12-11 21:25:42 +0000 | [diff] [blame] | 858 | // Include AMDGPU TD files | 
|  | 859 | include "R600Schedule.td" | 
| Konstantin Zhuravlyov | 27b0a03 | 2017-11-10 20:01:58 +0000 | [diff] [blame] | 860 | include "R600Processors.td" | 
| Tom Stellard | 75aadc2 | 2012-12-11 21:25:42 +0000 | [diff] [blame] | 861 | include "SISchedule.td" | 
| Konstantin Zhuravlyov | 27b0a03 | 2017-11-10 20:01:58 +0000 | [diff] [blame] | 862 | include "GCNProcessors.td" | 
| Tom Stellard | 75aadc2 | 2012-12-11 21:25:42 +0000 | [diff] [blame] | 863 | include "AMDGPUInstrInfo.td" | 
|  | 864 | include "AMDGPUIntrinsics.td" | 
|  | 865 | include "AMDGPURegisterInfo.td" | 
| Tom Stellard | ca16621 | 2017-01-30 21:56:46 +0000 | [diff] [blame] | 866 | include "AMDGPURegisterBanks.td" | 
| Tom Stellard | 75aadc2 | 2012-12-11 21:25:42 +0000 | [diff] [blame] | 867 | include "AMDGPUInstructions.td" | 
| Christian Konig | 2c8f6d5 | 2013-03-07 09:03:52 +0000 | [diff] [blame] | 868 | include "AMDGPUCallingConv.td" | 
| Nicolai Haehnle | 5d0d303 | 2018-04-01 17:09:07 +0000 | [diff] [blame] | 869 | include "AMDGPUSearchableTables.td" |