Matt Arsenault | 585b566 | 2015-05-07 17:02:32 +0000 | [diff] [blame] | 1 | //===-- AMDGPU.td - AMDGPU Tablegen files ------------------*- tablegen -*-===// |
Tom Stellard | 75aadc2 | 2012-12-11 21:25:42 +0000 | [diff] [blame] | 2 | // |
| 3 | // The LLVM Compiler Infrastructure |
| 4 | // |
| 5 | // This file is distributed under the University of Illinois Open Source |
| 6 | // License. See LICENSE.TXT for details. |
| 7 | // |
Matt Arsenault | 585b566 | 2015-05-07 17:02:32 +0000 | [diff] [blame] | 8 | //===----------------------------------------------------------------------===// |
Tom Stellard | 75aadc2 | 2012-12-11 21:25:42 +0000 | [diff] [blame] | 9 | |
Tom Stellard | bc5b537 | 2014-06-13 16:38:59 +0000 | [diff] [blame] | 10 | include "llvm/Target/Target.td" |
Tom Stellard | 75aadc2 | 2012-12-11 21:25:42 +0000 | [diff] [blame] | 11 | |
Tom Stellard | 9979277 | 2013-06-07 20:28:49 +0000 | [diff] [blame] | 12 | //===----------------------------------------------------------------------===// |
| 13 | // Subtarget Features |
| 14 | //===----------------------------------------------------------------------===// |
| 15 | |
Tom Stellard | a6c6e1b | 2013-06-07 20:37:48 +0000 | [diff] [blame] | 16 | // Debugging Features |
| 17 | |
// Debugging switch: the "DumpCode" feature sets the subtarget's DumpCode
// attribute to true.
def FeatureDumpCode : SubtargetFeature<
  "DumpCode",                              // feature name
  "DumpCode",                              // subtarget attribute
  "true",                                  // value assigned to the attribute
  "Dump MachineInstrs in the CodeEmitter"  // description
>;
| 22 | |
// Lower-case spelling ("dumpcode") of the DumpCode feature. It writes the
// same DumpCode attribute with the same value as FeatureDumpCode.
def FeatureDumpCodeLower : SubtargetFeature<
  "dumpcode",
  "DumpCode",
  "true",
  "Dump MachineInstrs in the CodeEmitter"
>;
| 27 | |
// Negative-sense feature: selecting "disable-irstructurizer" writes "false"
// into EnableIRStructurizer.
def FeatureIRStructurizer : SubtargetFeature<
  "disable-irstructurizer",
  "EnableIRStructurizer",
  "false",
  "Disable IR Structurizer"
>;
Tom Stellard | ed0ceec | 2013-10-10 17:11:12 +0000 | [diff] [blame] | 32 | |
// "promote-alloca" sets EnablePromoteAlloca to true.
def FeaturePromoteAlloca : SubtargetFeature<
  "promote-alloca",
  "EnablePromoteAlloca",
  "true",
  "Enable promote alloca pass"
>;
| 37 | |
Tom Stellard | a6c6e1b | 2013-06-07 20:37:48 +0000 | [diff] [blame] | 38 | // Target features |
| 39 | |
// Negative-sense feature: selecting "disable-ifcvt" writes "false" into
// EnableIfCvt.
def FeatureIfCvt : SubtargetFeature<
  "disable-ifcvt",
  "EnableIfCvt",
  "false",
  "Disable the if conversion pass"
>;
| 44 | |
// "fp64" sets the FP64 attribute to true.
def FeatureFP64 : SubtargetFeature<
  "fp64",
  "FP64",
  "true",
  "Enable double precision operations"
>;
Tom Stellard | 9979277 | 2013-06-07 20:28:49 +0000 | [diff] [blame] | 49 | |
// "fp64-denormals" sets FP64Denormals to true and implies FeatureFP64.
def FeatureFP64Denormals : SubtargetFeature<
  "fp64-denormals",
  "FP64Denormals",
  "true",
  "Enable double precision denormal handling",
  [FeatureFP64]  // implied features
>;
| 55 | |
// "fast-fmaf" sets FastFMAF32 to true; it implies no other feature (the
// implied-feature list is given explicitly as empty).
def FeatureFastFMAF32 : SubtargetFeature<
  "fast-fmaf",
  "FastFMAF32",
  "true",
  "Assuming f32 fma is at least as fast as mul + add",
  []
>;
| 61 | |
// Caveats for fp32 denormals:
//  - some instructions do not support denormals even when this flag is set;
//  - enabling fp32 denormals also makes instructions run at the device's
//    double precision rate.
def FeatureFP32Denormals : SubtargetFeature<
  "fp32-denormals",
  "FP32Denormals",
  "true",
  "Enable single precision denormal handling"
>;
| 69 | |
// "64BitPtr" sets the Is64bit attribute to true.
def Feature64BitPtr : SubtargetFeature<
  "64BitPtr",
  "Is64bit",
  "true",
  "Specify if 64-bit addressing should be used"
>;
Tom Stellard | 9979277 | 2013-06-07 20:28:49 +0000 | [diff] [blame] | 74 | |
// Note the value: selecting "R600ALUInst" writes "false" (not "true") into
// the R600ALUInst attribute.
def FeatureR600ALUInst : SubtargetFeature<
  "R600ALUInst",
  "R600ALUInst",
  "false",
  "Older version of ALU instructions encoding"
>;
Tom Stellard | 9979277 | 2013-06-07 20:28:49 +0000 | [diff] [blame] | 79 | |
// "HasVertexCache" sets the HasVertexCache attribute to true.
def FeatureVertexCache : SubtargetFeature<
  "HasVertexCache",
  "HasVertexCache",
  "true",
  "Specify use of dedicated vertex cache"
>;
Tom Stellard | 9979277 | 2013-06-07 20:28:49 +0000 | [diff] [blame] | 84 | |
// "caymanISA" sets the CaymanISA attribute to true.
def FeatureCaymanISA : SubtargetFeature<
  "caymanISA",
  "CaymanISA",
  "true",
  "Use Cayman ISA"
>;
| 89 | |
// Hardware-bug marker: "cfalubug" sets the CFALUBug attribute to true.
def FeatureCFALUBug : SubtargetFeature<
  "cfalubug",
  "CFALUBug",
  "true",
  "GPU has CF_ALU bug"
>;
| 94 | |
// XXX - Candidate for removal once the optimizer is enabled by default.
// "load-store-opt" sets EnableLoadStoreOpt to true.
def FeatureEnableLoadStoreOpt : SubtargetFeature<
  "load-store-opt",
  "EnableLoadStoreOpt",
  "true",
  "Enable SI load/store optimizer pass"
>;
| 100 | |
// "flat-address-space" sets the FlatAddressSpace attribute to true.
def FeatureFlatAddressSpace : SubtargetFeature<
  "flat-address-space",
  "FlatAddressSpace",
  "true",
  "Support flat address space"
>;
| 105 | |
// "vgpr-spilling" sets EnableVGPRSpilling to true.
def FeatureVGPRSpilling : SubtargetFeature<
  "vgpr-spilling",
  "EnableVGPRSpilling",
  "true",
  "Enable spilling of VGPRs to scratch memory"
>;
| 110 | |
// Hardware-bug marker: "sgpr-init-bug" sets the SGPRInitBug attribute to
// true. Per the description, this covers a VI SGPR initialization bug that
// requires a fixed SGPR allocation size.
def FeatureSGPRInitBug : SubtargetFeature<
  "sgpr-init-bug",
  "SGPRInitBug",
  "true",
  // Spelling fixed: was "initilization".
  "VI SGPR initialization bug requiring a fixed SGPR allocation size"
>;
| 115 | |
// Template for fetch-limit features. For a given Value it produces a feature
// named "fetch<Value>" that assigns Value to TexVTXClauseSize; Value is also
// appended to the description text.
class SubtargetFeatureFetchLimit<string Value> : SubtargetFeature<
  "fetch" # Value,
  "TexVTXClauseSize",
  Value,
  "Limit the maximum number of fetches in a clause to " # Value
>;
Tom Stellard | 9979277 | 2013-06-07 20:28:49 +0000 | [diff] [blame] | 121 | |
// Concrete fetch limits: "fetch8" and "fetch16".
def FeatureFetchLimit8  : SubtargetFeatureFetchLimit<"8">;
def FeatureFetchLimit16 : SubtargetFeatureFetchLimit<"16">;
| 124 | |
// Template for wavefront-size features. The integer Value is pasted onto the
// feature name ("wavefrontsize<Value>") and, converted to a string, assigned
// to the WavefrontSize attribute.
class SubtargetFeatureWavefrontSize<int Value> : SubtargetFeature<
  "wavefrontsize" # Value,
  "WavefrontSize",
  !cast<string>(Value),
  "The number of threads per wavefront"
>;
| 130 | |
// Concrete wavefront sizes: 16, 32 and 64.
def FeatureWavefrontSize16 : SubtargetFeatureWavefrontSize< 16 >;
def FeatureWavefrontSize32 : SubtargetFeatureWavefrontSize< 32 >;
def FeatureWavefrontSize64 : SubtargetFeatureWavefrontSize< 64 >;
| 134 | |
// Template for LDS bank-count features. The integer Value is pasted onto the
// feature name ("ldsbankcount<Value>") and, converted to a string, assigned
// to the LDSBankCount attribute.
class SubtargetFeatureLDSBankCount<int Value> : SubtargetFeature<
  "ldsbankcount" # Value,
  "LDSBankCount",
  !cast<string>(Value),
  "The number of LDS banks per compute unit."
>;
| 140 | |
// Concrete LDS bank counts: 16 and 32.
def FeatureLDSBankCount16 : SubtargetFeatureLDSBankCount< 16 >;
def FeatureLDSBankCount32 : SubtargetFeatureLDSBankCount< 32 >;
| 143 | |
// Template for local-memory-size features. The integer Value (in bytes, per
// the description) is pasted onto the feature name
// ("localmemorysize<Value>") and, converted to a string, assigned to the
// LocalMemorySize attribute.
class SubtargetFeatureLocalMemorySize<int Value> : SubtargetFeature<
  "localmemorysize" # Value,
  "LocalMemorySize",
  !cast<string>(Value),
  "The size of local memory in bytes"
>;
| 149 | |
// "gcn" sets the IsGCN attribute to true.
def FeatureGCN : SubtargetFeature<
  "gcn",
  "IsGCN",
  "true",
  "GCN or newer GPU"
>;
| 154 | |
// "gcn1-encoding" sets GCN1Encoding to true (SI and CI encoding format, per
// the description).
def FeatureGCN1Encoding : SubtargetFeature<
  "gcn1-encoding",
  "GCN1Encoding",
  "true",
  "Encoding format for SI and CI"
>;
| 159 | |
// "gcn3-encoding" sets GCN3Encoding to true (VI encoding format, per the
// description).
def FeatureGCN3Encoding : SubtargetFeature<
  "gcn3-encoding",
  "GCN3Encoding",
  "true",
  "Encoding format for VI"
>;
Tom Stellard | d1f0f02 | 2015-04-23 19:33:54 +0000 | [diff] [blame] | 164 | |
// "ci-insts" sets the CIInsts attribute to true; per the description it
// marks the additional instructions available on CI and later.
def FeatureCIInsts : SubtargetFeature<
  "ci-insts",
  "CIInsts",
  "true",
  // Spelling fixed: was "intstructions".
  "Additional instructions for CI+"
>;
| 169 | |
// Placeholder feature whose purpose is to disable assembler instructions.
// Its feature name is deliberately the empty string.
def FeatureDisable : SubtargetFeature<
  "",
  "FeatureDisable",
  "true",
  // Two adjacent literals, concatenated by TableGen into one description.
  "Dummy feature to disable assembler"
  " instructions"
>;
| 175 | |
// Template for GPU-generation features. Value serves as the feature name, is
// qualified as "AMDGPUSubtarget::<Value>" for assignment to the Gen
// attribute, and prefixes the description. Implies lists the features that
// the generation brings along.
class SubtargetFeatureGeneration<string Value,
                                 list<SubtargetFeature> Implies>
  : SubtargetFeature<
      Value,
      "Gen",
      "AMDGPUSubtarget::" # Value,
      Value # " GPU generation",
      Implies
    >;
| 180 | |
// Concrete local memory sizes: 0, 32768 and 65536.
def FeatureLocalMemorySize0     : SubtargetFeatureLocalMemorySize< 0 >;
def FeatureLocalMemorySize32768 : SubtargetFeatureLocalMemorySize< 32768 >;
def FeatureLocalMemorySize65536 : SubtargetFeatureLocalMemorySize< 65536 >;
| 184 | |
// R600 generation and the features it implies.
def FeatureR600 : SubtargetFeatureGeneration<
  "R600",
  [
    FeatureR600ALUInst,
    FeatureFetchLimit8,
    FeatureLocalMemorySize0
  ]
>;
Tom Stellard | a6c6e1b | 2013-06-07 20:37:48 +0000 | [diff] [blame] | 187 | |
// R700 generation and the features it implies.
def FeatureR700 : SubtargetFeatureGeneration<
  "R700",
  [
    FeatureFetchLimit16,
    FeatureLocalMemorySize0
  ]
>;
Tom Stellard | a6c6e1b | 2013-06-07 20:37:48 +0000 | [diff] [blame] | 190 | |
// Evergreen generation and the features it implies.
def FeatureEvergreen : SubtargetFeatureGeneration<
  "EVERGREEN",
  [
    FeatureFetchLimit16,
    FeatureLocalMemorySize32768
  ]
>;
Tom Stellard | a6c6e1b | 2013-06-07 20:37:48 +0000 | [diff] [blame] | 193 | |
// Northern Islands generation and the features it implies.
def FeatureNorthernIslands : SubtargetFeatureGeneration<
  "NORTHERN_ISLANDS",
  [
    FeatureFetchLimit16,
    FeatureWavefrontSize64,
    FeatureLocalMemorySize32768
  ]
>;
Tom Stellard | a6c6e1b | 2013-06-07 20:37:48 +0000 | [diff] [blame] | 198 | |
// Southern Islands generation and the features it implies.
def FeatureSouthernIslands : SubtargetFeatureGeneration<
  "SOUTHERN_ISLANDS",
  [
    Feature64BitPtr,
    FeatureFP64,
    FeatureLocalMemorySize32768,
    FeatureWavefrontSize64,
    FeatureGCN,
    FeatureGCN1Encoding,
    FeatureLDSBankCount32
  ]
>;
Tom Stellard | a6c6e1b | 2013-06-07 20:37:48 +0000 | [diff] [blame] | 203 | |
// Sea Islands generation and the features it implies. No LDS bank count
// feature appears in this list.
def FeatureSeaIslands : SubtargetFeatureGeneration<
  "SEA_ISLANDS",
  [
    Feature64BitPtr,
    FeatureFP64,
    FeatureLocalMemorySize65536,
    FeatureWavefrontSize64,
    FeatureGCN,
    FeatureFlatAddressSpace,
    FeatureGCN1Encoding,
    FeatureCIInsts
  ]
>;
Marek Olsak | 5df00d6 | 2014-12-07 12:18:57 +0000 | [diff] [blame] | 208 | |
// Volcanic Islands generation and the features it implies.
def FeatureVolcanicIslands : SubtargetFeatureGeneration<
  "VOLCANIC_ISLANDS",
  [
    Feature64BitPtr,
    FeatureFP64,
    FeatureLocalMemorySize65536,
    FeatureWavefrontSize64,
    FeatureFlatAddressSpace,
    FeatureGCN,
    FeatureGCN3Encoding,
    FeatureCIInsts,
    FeatureLDSBankCount32
  ]
>;
Marek Olsak | 5df00d6 | 2014-12-07 12:18:57 +0000 | [diff] [blame] | 213 | |
Tom Stellard | 3498e4f | 2013-06-07 20:28:55 +0000 | [diff] [blame] | 214 | //===----------------------------------------------------------------------===// |
Tom Stellard | 75aadc2 | 2012-12-11 21:25:42 +0000 | [diff] [blame] | 215 | |
// Instruction-info record for the target; both flags below are switched on.
def AMDGPUInstrInfo : InstrInfo {
  let noNamedPositionallyEncodedOperands = 1;
  let guessInstructionProperties = 1;
}
| 220 | |
def AMDGPUAsmParser : AsmParser {
  // Emitting the register-name matcher crashes because several R600
  // registers share one asm name (e.g. T0_XYZW and T0_XY are both "T0"),
  // so it is turned off.
  let ShouldEmitMatchRegisterName = 0;
}
| 226 | |
// Top-level target record: wires in the assembly parser and the instruction
// info defined in this file.
def AMDGPU : Target {
  let AssemblyParsers = [AMDGPUAsmParser];
  // Pull in Instruction Info:
  let InstructionSet = AMDGPUInstrInfo;
}
| 232 | |
// Placeholder scheduling records (a functional unit and an itinerary class)
// used as dummy itineraries for pseudo instructions.
def ALU_NULL : FuncUnit;
def NullALU  : InstrItinClass;
| 236 | |
Tom Stellard | 0e70de5 | 2014-05-16 20:56:45 +0000 | [diff] [blame] | 237 | //===----------------------------------------------------------------------===// |
| 238 | // Predicate helper class |
| 239 | //===----------------------------------------------------------------------===// |
| 240 | |
// Predicate whose condition string is the constant "true".
def TruePredicate : Predicate< "true" >;
// Matches the SOUTHERN_ISLANDS or SEA_ISLANDS generation. The condition is
// written as two adjacent string literals that TableGen joins; on the
// assembler side the predicate is keyed on FeatureGCN1Encoding.
def isSICI
  : Predicate<
      "Subtarget->getGeneration() == AMDGPUSubtarget::SOUTHERN_ISLANDS ||"
      "Subtarget->getGeneration() == AMDGPUSubtarget::SEA_ISLANDS"
    >,
    AssemblerPredicate<"FeatureGCN1Encoding">;
| 246 | |
// Mix-in that gathers a record's individual predicate fields and folds them
// into a single Predicates list.
class PredicateControl {
  // Declared without a value here.
  Predicate SubtargetPredicate;

  // Defaults to isSICI. Note that this field is not part of the Predicates
  // list assembled below.
  Predicate SIAssemblerPredicate = isSICI;

  list<Predicate> AssemblerPredicates = [];
  Predicate AssemblerPredicate = TruePredicate;
  list<Predicate> OtherPredicates = [];

  // Order of the result: SubtargetPredicate, AssemblerPredicate, then every
  // entry of AssemblerPredicates, then every entry of OtherPredicates.
  list<Predicate> Predicates =
    !listconcat([SubtargetPredicate, AssemblerPredicate],
                AssemblerPredicates,
                OtherPredicates);
}
| 257 | |
Tom Stellard | 75aadc2 | 2012-12-11 21:25:42 +0000 | [diff] [blame] | 258 | // Include AMDGPU TD files |
| 259 | include "R600Schedule.td" |
| 260 | include "SISchedule.td" |
| 261 | include "Processors.td" |
| 262 | include "AMDGPUInstrInfo.td" |
| 263 | include "AMDGPUIntrinsics.td" |
| 264 | include "AMDGPURegisterInfo.td" |
| 265 | include "AMDGPUInstructions.td" |
Christian Konig | 2c8f6d5 | 2013-03-07 09:03:52 +0000 | [diff] [blame] | 266 | include "AMDGPUCallingConv.td" |