| Konstantin Zhuravlyov | a63b0f9 | 2017-10-11 22:18:53 +0000 | [diff] [blame] | 1 | //===--- AMDGPUHSAMetadataStreamer.cpp --------------------------*- C++ -*-===// |
| Konstantin Zhuravlyov | 7498cd6 | 2017-03-22 22:32:22 +0000 | [diff] [blame] | 2 | // |
| 3 | // The LLVM Compiler Infrastructure |
| 4 | // |
| 5 | // This file is distributed under the University of Illinois Open Source |
| 6 | // License. See LICENSE.TXT for details. |
| 7 | // |
| 8 | //===----------------------------------------------------------------------===// |
| 9 | // |
| 10 | /// \file |
| Adrian Prantl | 5f8f34e4 | 2018-05-01 15:54:18 +0000 | [diff] [blame] | 11 | /// AMDGPU HSA Metadata Streamer. |
| Konstantin Zhuravlyov | 7498cd6 | 2017-03-22 22:32:22 +0000 | [diff] [blame] | 12 | /// |
| 13 | // |
| 14 | //===----------------------------------------------------------------------===// |
| 15 | |
| Konstantin Zhuravlyov | a63b0f9 | 2017-10-11 22:18:53 +0000 | [diff] [blame] | 16 | #include "AMDGPUHSAMetadataStreamer.h" |
| Scott Linder | 2ad2c18 | 2018-07-10 17:31:32 +0000 | [diff] [blame] | 17 | #include "AMDGPU.h" |
| 18 | #include "AMDGPUSubtarget.h" |
| 19 | #include "SIMachineFunctionInfo.h" |
| 20 | #include "SIProgramInfo.h" |
| Konstantin Zhuravlyov | f0badd5 | 2018-07-10 16:12:51 +0000 | [diff] [blame] | 21 | #include "Utils/AMDGPUBaseInfo.h" |
| Konstantin Zhuravlyov | 7498cd6 | 2017-03-22 22:32:22 +0000 | [diff] [blame] | 22 | #include "llvm/ADT/StringSwitch.h" |
| 23 | #include "llvm/IR/Constants.h" |
| 24 | #include "llvm/IR/Module.h" |
| Konstantin Zhuravlyov | 1e2b878 | 2017-06-06 18:35:50 +0000 | [diff] [blame] | 25 | #include "llvm/Support/raw_ostream.h" |
| Konstantin Zhuravlyov | 7498cd6 | 2017-03-22 22:32:22 +0000 | [diff] [blame] | 26 | |
| 27 | namespace llvm { |
| 28 | |
| Konstantin Zhuravlyov | a63b0f9 | 2017-10-11 22:18:53 +0000 | [diff] [blame] | 29 | static cl::opt<bool> DumpHSAMetadata( |
| 30 | "amdgpu-dump-hsa-metadata", |
| 31 | cl::desc("Dump AMDGPU HSA Metadata")); |
| 32 | static cl::opt<bool> VerifyHSAMetadata( |
| 33 | "amdgpu-verify-hsa-metadata", |
| 34 | cl::desc("Verify AMDGPU HSA Metadata")); |
| Konstantin Zhuravlyov | 7498cd6 | 2017-03-22 22:32:22 +0000 | [diff] [blame] | 35 | |
| Konstantin Zhuravlyov | 7498cd6 | 2017-03-22 22:32:22 +0000 | [diff] [blame] | 36 | namespace AMDGPU { |
| Konstantin Zhuravlyov | a63b0f9 | 2017-10-11 22:18:53 +0000 | [diff] [blame] | 37 | namespace HSAMD { |
| Konstantin Zhuravlyov | 7498cd6 | 2017-03-22 22:32:22 +0000 | [diff] [blame] | 38 | |
| Konstantin Zhuravlyov | 516651b | 2017-10-11 22:59:35 +0000 | [diff] [blame] | 39 | void MetadataStreamer::dump(StringRef HSAMetadataString) const { |
| 40 | errs() << "AMDGPU HSA Metadata:\n" << HSAMetadataString << '\n'; |
| Konstantin Zhuravlyov | 7498cd6 | 2017-03-22 22:32:22 +0000 | [diff] [blame] | 41 | } |
| 42 | |
| Konstantin Zhuravlyov | 516651b | 2017-10-11 22:59:35 +0000 | [diff] [blame] | 43 | void MetadataStreamer::verify(StringRef HSAMetadataString) const { |
| Konstantin Zhuravlyov | a63b0f9 | 2017-10-11 22:18:53 +0000 | [diff] [blame] | 44 | errs() << "AMDGPU HSA Metadata Parser Test: "; |
| Konstantin Zhuravlyov | 7498cd6 | 2017-03-22 22:32:22 +0000 | [diff] [blame] | 45 | |
| Konstantin Zhuravlyov | 516651b | 2017-10-11 22:59:35 +0000 | [diff] [blame] | 46 | HSAMD::Metadata FromHSAMetadataString; |
| 47 | if (fromString(HSAMetadataString, FromHSAMetadataString)) { |
| Konstantin Zhuravlyov | 7498cd6 | 2017-03-22 22:32:22 +0000 | [diff] [blame] | 48 | errs() << "FAIL\n"; |
| 49 | return; |
| 50 | } |
| 51 | |
| Konstantin Zhuravlyov | 516651b | 2017-10-11 22:59:35 +0000 | [diff] [blame] | 52 | std::string ToHSAMetadataString; |
| 53 | if (toString(FromHSAMetadataString, ToHSAMetadataString)) { |
| Konstantin Zhuravlyov | 7498cd6 | 2017-03-22 22:32:22 +0000 | [diff] [blame] | 54 | errs() << "FAIL\n"; |
| 55 | return; |
| 56 | } |
| 57 | |
| Konstantin Zhuravlyov | 516651b | 2017-10-11 22:59:35 +0000 | [diff] [blame] | 58 | errs() << (HSAMetadataString == ToHSAMetadataString ? "PASS" : "FAIL") |
| 59 | << '\n'; |
| 60 | if (HSAMetadataString != ToHSAMetadataString) { |
| 61 | errs() << "Original input: " << HSAMetadataString << '\n' |
| 62 | << "Produced output: " << ToHSAMetadataString << '\n'; |
| Konstantin Zhuravlyov | 7498cd6 | 2017-03-22 22:32:22 +0000 | [diff] [blame] | 63 | } |
| 64 | } |
| 65 | |
| 66 | AccessQualifier MetadataStreamer::getAccessQualifier(StringRef AccQual) const { |
| 67 | if (AccQual.empty()) |
| 68 | return AccessQualifier::Unknown; |
| 69 | |
| 70 | return StringSwitch<AccessQualifier>(AccQual) |
| 71 | .Case("read_only", AccessQualifier::ReadOnly) |
| 72 | .Case("write_only", AccessQualifier::WriteOnly) |
| 73 | .Case("read_write", AccessQualifier::ReadWrite) |
| 74 | .Default(AccessQualifier::Default); |
| 75 | } |
| 76 | |
| 77 | AddressSpaceQualifier MetadataStreamer::getAddressSpaceQualifer( |
| 78 | unsigned AddressSpace) const { |
| Matt Arsenault | b998674 | 2018-09-10 02:23:30 +0000 | [diff] [blame] | 79 | switch (AddressSpace) { |
| 80 | case AMDGPUAS::PRIVATE_ADDRESS: |
| Konstantin Zhuravlyov | 7498cd6 | 2017-03-22 22:32:22 +0000 | [diff] [blame] | 81 | return AddressSpaceQualifier::Private; |
| Matt Arsenault | b998674 | 2018-09-10 02:23:30 +0000 | [diff] [blame] | 82 | case AMDGPUAS::GLOBAL_ADDRESS: |
| Konstantin Zhuravlyov | 7498cd6 | 2017-03-22 22:32:22 +0000 | [diff] [blame] | 83 | return AddressSpaceQualifier::Global; |
| Matt Arsenault | b998674 | 2018-09-10 02:23:30 +0000 | [diff] [blame] | 84 | case AMDGPUAS::CONSTANT_ADDRESS: |
| Konstantin Zhuravlyov | 7498cd6 | 2017-03-22 22:32:22 +0000 | [diff] [blame] | 85 | return AddressSpaceQualifier::Constant; |
| Matt Arsenault | b998674 | 2018-09-10 02:23:30 +0000 | [diff] [blame] | 86 | case AMDGPUAS::LOCAL_ADDRESS: |
| Konstantin Zhuravlyov | 7498cd6 | 2017-03-22 22:32:22 +0000 | [diff] [blame] | 87 | return AddressSpaceQualifier::Local; |
| Matt Arsenault | b998674 | 2018-09-10 02:23:30 +0000 | [diff] [blame] | 88 | case AMDGPUAS::FLAT_ADDRESS: |
| Konstantin Zhuravlyov | 7498cd6 | 2017-03-22 22:32:22 +0000 | [diff] [blame] | 89 | return AddressSpaceQualifier::Generic; |
| Matt Arsenault | b998674 | 2018-09-10 02:23:30 +0000 | [diff] [blame] | 90 | case AMDGPUAS::REGION_ADDRESS: |
| Konstantin Zhuravlyov | 7498cd6 | 2017-03-22 22:32:22 +0000 | [diff] [blame] | 91 | return AddressSpaceQualifier::Region; |
| Matt Arsenault | b998674 | 2018-09-10 02:23:30 +0000 | [diff] [blame] | 92 | default: |
| 93 | return AddressSpaceQualifier::Unknown; |
| 94 | } |
| Konstantin Zhuravlyov | 7498cd6 | 2017-03-22 22:32:22 +0000 | [diff] [blame] | 95 | } |
| 96 | |
| 97 | ValueKind MetadataStreamer::getValueKind(Type *Ty, StringRef TypeQual, |
| 98 | StringRef BaseTypeName) const { |
| 99 | if (TypeQual.find("pipe") != StringRef::npos) |
| 100 | return ValueKind::Pipe; |
| 101 | |
| 102 | return StringSwitch<ValueKind>(BaseTypeName) |
| Konstantin Zhuravlyov | 54ba431 | 2017-04-25 20:38:26 +0000 | [diff] [blame] | 103 | .Case("image1d_t", ValueKind::Image) |
| 104 | .Case("image1d_array_t", ValueKind::Image) |
| 105 | .Case("image1d_buffer_t", ValueKind::Image) |
| 106 | .Case("image2d_t", ValueKind::Image) |
| 107 | .Case("image2d_array_t", ValueKind::Image) |
| 108 | .Case("image2d_array_depth_t", ValueKind::Image) |
| 109 | .Case("image2d_array_msaa_t", ValueKind::Image) |
| 110 | .Case("image2d_array_msaa_depth_t", ValueKind::Image) |
| 111 | .Case("image2d_depth_t", ValueKind::Image) |
| 112 | .Case("image2d_msaa_t", ValueKind::Image) |
| 113 | .Case("image2d_msaa_depth_t", ValueKind::Image) |
| 114 | .Case("image3d_t", ValueKind::Image) |
| Konstantin Zhuravlyov | 7498cd6 | 2017-03-22 22:32:22 +0000 | [diff] [blame] | 115 | .Case("sampler_t", ValueKind::Sampler) |
| 116 | .Case("queue_t", ValueKind::Queue) |
| Konstantin Zhuravlyov | 7498cd6 | 2017-03-22 22:32:22 +0000 | [diff] [blame] | 117 | .Default(isa<PointerType>(Ty) ? |
| 118 | (Ty->getPointerAddressSpace() == |
| Matt Arsenault | 0da6350 | 2018-08-31 05:49:54 +0000 | [diff] [blame] | 119 | AMDGPUAS::LOCAL_ADDRESS ? |
| Konstantin Zhuravlyov | 7498cd6 | 2017-03-22 22:32:22 +0000 | [diff] [blame] | 120 | ValueKind::DynamicSharedPointer : |
| 121 | ValueKind::GlobalBuffer) : |
| 122 | ValueKind::ByValue); |
| 123 | } |
| 124 | |
| 125 | ValueType MetadataStreamer::getValueType(Type *Ty, StringRef TypeName) const { |
| 126 | switch (Ty->getTypeID()) { |
| 127 | case Type::IntegerTyID: { |
| 128 | auto Signed = !TypeName.startswith("u"); |
| 129 | switch (Ty->getIntegerBitWidth()) { |
| 130 | case 8: |
| 131 | return Signed ? ValueType::I8 : ValueType::U8; |
| 132 | case 16: |
| 133 | return Signed ? ValueType::I16 : ValueType::U16; |
| 134 | case 32: |
| 135 | return Signed ? ValueType::I32 : ValueType::U32; |
| 136 | case 64: |
| 137 | return Signed ? ValueType::I64 : ValueType::U64; |
| 138 | default: |
| 139 | return ValueType::Struct; |
| 140 | } |
| 141 | } |
| 142 | case Type::HalfTyID: |
| 143 | return ValueType::F16; |
| 144 | case Type::FloatTyID: |
| 145 | return ValueType::F32; |
| 146 | case Type::DoubleTyID: |
| 147 | return ValueType::F64; |
| 148 | case Type::PointerTyID: |
| 149 | return getValueType(Ty->getPointerElementType(), TypeName); |
| 150 | case Type::VectorTyID: |
| 151 | return getValueType(Ty->getVectorElementType(), TypeName); |
| 152 | default: |
| 153 | return ValueType::Struct; |
| 154 | } |
| 155 | } |
| 156 | |
| 157 | std::string MetadataStreamer::getTypeName(Type *Ty, bool Signed) const { |
| 158 | switch (Ty->getTypeID()) { |
| 159 | case Type::IntegerTyID: { |
| 160 | if (!Signed) |
| 161 | return (Twine('u') + getTypeName(Ty, true)).str(); |
| 162 | |
| 163 | auto BitWidth = Ty->getIntegerBitWidth(); |
| 164 | switch (BitWidth) { |
| 165 | case 8: |
| 166 | return "char"; |
| 167 | case 16: |
| 168 | return "short"; |
| 169 | case 32: |
| 170 | return "int"; |
| 171 | case 64: |
| 172 | return "long"; |
| 173 | default: |
| 174 | return (Twine('i') + Twine(BitWidth)).str(); |
| 175 | } |
| 176 | } |
| 177 | case Type::HalfTyID: |
| 178 | return "half"; |
| 179 | case Type::FloatTyID: |
| 180 | return "float"; |
| 181 | case Type::DoubleTyID: |
| 182 | return "double"; |
| 183 | case Type::VectorTyID: { |
| 184 | auto VecTy = cast<VectorType>(Ty); |
| 185 | auto ElTy = VecTy->getElementType(); |
| 186 | auto NumElements = VecTy->getVectorNumElements(); |
| 187 | return (Twine(getTypeName(ElTy, Signed)) + Twine(NumElements)).str(); |
| 188 | } |
| 189 | default: |
| 190 | return "unknown"; |
| 191 | } |
| 192 | } |
| 193 | |
| 194 | std::vector<uint32_t> MetadataStreamer::getWorkGroupDimensions( |
| 195 | MDNode *Node) const { |
| 196 | std::vector<uint32_t> Dims; |
| 197 | if (Node->getNumOperands() != 3) |
| 198 | return Dims; |
| 199 | |
| 200 | for (auto &Op : Node->operands()) |
| 201 | Dims.push_back(mdconst::extract<ConstantInt>(Op)->getZExtValue()); |
| 202 | return Dims; |
| 203 | } |
| 204 | |
| Scott Linder | 2ad2c18 | 2018-07-10 17:31:32 +0000 | [diff] [blame] | 205 | Kernel::CodeProps::Metadata MetadataStreamer::getHSACodeProps( |
| 206 | const MachineFunction &MF, |
| 207 | const SIProgramInfo &ProgramInfo) const { |
| Tom Stellard | 5bfbae5 | 2018-07-11 20:59:01 +0000 | [diff] [blame] | 208 | const GCNSubtarget &STM = MF.getSubtarget<GCNSubtarget>(); |
| Scott Linder | 2ad2c18 | 2018-07-10 17:31:32 +0000 | [diff] [blame] | 209 | const SIMachineFunctionInfo &MFI = *MF.getInfo<SIMachineFunctionInfo>(); |
| 210 | HSAMD::Kernel::CodeProps::Metadata HSACodeProps; |
| 211 | const Function &F = MF.getFunction(); |
| 212 | |
| Matt Arsenault | 4bec7d4 | 2018-07-20 09:05:08 +0000 | [diff] [blame] | 213 | assert(F.getCallingConv() == CallingConv::AMDGPU_KERNEL || |
| 214 | F.getCallingConv() == CallingConv::SPIR_KERNEL); |
| Scott Linder | 2ad2c18 | 2018-07-10 17:31:32 +0000 | [diff] [blame] | 215 | |
| Matt Arsenault | 4bec7d4 | 2018-07-20 09:05:08 +0000 | [diff] [blame] | 216 | unsigned MaxKernArgAlign; |
| 217 | HSACodeProps.mKernargSegmentSize = STM.getKernArgSegmentSize(F, |
| 218 | MaxKernArgAlign); |
| Scott Linder | 2ad2c18 | 2018-07-10 17:31:32 +0000 | [diff] [blame] | 219 | HSACodeProps.mGroupSegmentFixedSize = ProgramInfo.LDSSize; |
| 220 | HSACodeProps.mPrivateSegmentFixedSize = ProgramInfo.ScratchSize; |
| Matt Arsenault | 4bec7d4 | 2018-07-20 09:05:08 +0000 | [diff] [blame] | 221 | HSACodeProps.mKernargSegmentAlign = std::max(MaxKernArgAlign, 4u); |
| Scott Linder | 2ad2c18 | 2018-07-10 17:31:32 +0000 | [diff] [blame] | 222 | HSACodeProps.mWavefrontSize = STM.getWavefrontSize(); |
| 223 | HSACodeProps.mNumSGPRs = ProgramInfo.NumSGPR; |
| 224 | HSACodeProps.mNumVGPRs = ProgramInfo.NumVGPR; |
| 225 | HSACodeProps.mMaxFlatWorkGroupSize = MFI.getMaxFlatWorkGroupSize(); |
| 226 | HSACodeProps.mIsDynamicCallStack = ProgramInfo.DynamicCallStack; |
| 227 | HSACodeProps.mIsXNACKEnabled = STM.isXNACKEnabled(); |
| 228 | HSACodeProps.mNumSpilledSGPRs = MFI.getNumSpilledSGPRs(); |
| 229 | HSACodeProps.mNumSpilledVGPRs = MFI.getNumSpilledVGPRs(); |
| 230 | |
| 231 | return HSACodeProps; |
| 232 | } |
| 233 | |
| 234 | Kernel::DebugProps::Metadata MetadataStreamer::getHSADebugProps( |
| 235 | const MachineFunction &MF, |
| 236 | const SIProgramInfo &ProgramInfo) const { |
| Tom Stellard | 5bfbae5 | 2018-07-11 20:59:01 +0000 | [diff] [blame] | 237 | const GCNSubtarget &STM = MF.getSubtarget<GCNSubtarget>(); |
| Scott Linder | 2ad2c18 | 2018-07-10 17:31:32 +0000 | [diff] [blame] | 238 | HSAMD::Kernel::DebugProps::Metadata HSADebugProps; |
| 239 | |
| 240 | if (!STM.debuggerSupported()) |
| 241 | return HSADebugProps; |
| 242 | |
| 243 | HSADebugProps.mDebuggerABIVersion.push_back(1); |
| 244 | HSADebugProps.mDebuggerABIVersion.push_back(0); |
| 245 | |
| 246 | if (STM.debuggerEmitPrologue()) { |
| 247 | HSADebugProps.mPrivateSegmentBufferSGPR = |
| 248 | ProgramInfo.DebuggerPrivateSegmentBufferSGPR; |
| 249 | HSADebugProps.mWavefrontPrivateSegmentOffsetSGPR = |
| 250 | ProgramInfo.DebuggerWavefrontPrivateSegmentOffsetSGPR; |
| 251 | } |
| 252 | |
| 253 | return HSADebugProps; |
| 254 | } |
| 255 | |
| Konstantin Zhuravlyov | 7498cd6 | 2017-03-22 22:32:22 +0000 | [diff] [blame] | 256 | void MetadataStreamer::emitVersion() { |
| Konstantin Zhuravlyov | a63b0f9 | 2017-10-11 22:18:53 +0000 | [diff] [blame] | 257 | auto &Version = HSAMetadata.mVersion; |
| Konstantin Zhuravlyov | 7498cd6 | 2017-03-22 22:32:22 +0000 | [diff] [blame] | 258 | |
| Konstantin Zhuravlyov | a63b0f9 | 2017-10-11 22:18:53 +0000 | [diff] [blame] | 259 | Version.push_back(VersionMajor); |
| 260 | Version.push_back(VersionMinor); |
| Konstantin Zhuravlyov | 7498cd6 | 2017-03-22 22:32:22 +0000 | [diff] [blame] | 261 | } |
| 262 | |
| Konstantin Zhuravlyov | 7498cd6 | 2017-03-22 22:32:22 +0000 | [diff] [blame] | 263 | void MetadataStreamer::emitPrintf(const Module &Mod) { |
| Konstantin Zhuravlyov | a63b0f9 | 2017-10-11 22:18:53 +0000 | [diff] [blame] | 264 | auto &Printf = HSAMetadata.mPrintf; |
| Konstantin Zhuravlyov | 7498cd6 | 2017-03-22 22:32:22 +0000 | [diff] [blame] | 265 | |
| 266 | auto Node = Mod.getNamedMetadata("llvm.printf.fmts"); |
| 267 | if (!Node) |
| 268 | return; |
| 269 | |
| 270 | for (auto Op : Node->operands()) |
| 271 | if (Op->getNumOperands()) |
| 272 | Printf.push_back(cast<MDString>(Op->getOperand(0))->getString()); |
| 273 | } |
| 274 | |
| 275 | void MetadataStreamer::emitKernelLanguage(const Function &Func) { |
| Konstantin Zhuravlyov | a63b0f9 | 2017-10-11 22:18:53 +0000 | [diff] [blame] | 276 | auto &Kernel = HSAMetadata.mKernels.back(); |
| Konstantin Zhuravlyov | 7498cd6 | 2017-03-22 22:32:22 +0000 | [diff] [blame] | 277 | |
| 278 | // TODO: What about other languages? |
| 279 | auto Node = Func.getParent()->getNamedMetadata("opencl.ocl.version"); |
| 280 | if (!Node || !Node->getNumOperands()) |
| 281 | return; |
| 282 | auto Op0 = Node->getOperand(0); |
| 283 | if (Op0->getNumOperands() <= 1) |
| 284 | return; |
| 285 | |
| 286 | Kernel.mLanguage = "OpenCL C"; |
| 287 | Kernel.mLanguageVersion.push_back( |
| 288 | mdconst::extract<ConstantInt>(Op0->getOperand(0))->getZExtValue()); |
| 289 | Kernel.mLanguageVersion.push_back( |
| 290 | mdconst::extract<ConstantInt>(Op0->getOperand(1))->getZExtValue()); |
| 291 | } |
| 292 | |
| 293 | void MetadataStreamer::emitKernelAttrs(const Function &Func) { |
| Konstantin Zhuravlyov | a63b0f9 | 2017-10-11 22:18:53 +0000 | [diff] [blame] | 294 | auto &Attrs = HSAMetadata.mKernels.back().mAttrs; |
| Konstantin Zhuravlyov | 7498cd6 | 2017-03-22 22:32:22 +0000 | [diff] [blame] | 295 | |
| 296 | if (auto Node = Func.getMetadata("reqd_work_group_size")) |
| 297 | Attrs.mReqdWorkGroupSize = getWorkGroupDimensions(Node); |
| 298 | if (auto Node = Func.getMetadata("work_group_size_hint")) |
| 299 | Attrs.mWorkGroupSizeHint = getWorkGroupDimensions(Node); |
| 300 | if (auto Node = Func.getMetadata("vec_type_hint")) { |
| 301 | Attrs.mVecTypeHint = getTypeName( |
| 302 | cast<ValueAsMetadata>(Node->getOperand(0))->getType(), |
| 303 | mdconst::extract<ConstantInt>(Node->getOperand(1))->getZExtValue()); |
| 304 | } |
| Yaxun Liu | de4b88d | 2017-10-10 19:39:48 +0000 | [diff] [blame] | 305 | if (Func.hasFnAttribute("runtime-handle")) { |
| 306 | Attrs.mRuntimeHandle = |
| 307 | Func.getFnAttribute("runtime-handle").getValueAsString().str(); |
| 308 | } |
| Konstantin Zhuravlyov | 7498cd6 | 2017-03-22 22:32:22 +0000 | [diff] [blame] | 309 | } |
| 310 | |
| 311 | void MetadataStreamer::emitKernelArgs(const Function &Func) { |
| 312 | for (auto &Arg : Func.args()) |
| 313 | emitKernelArg(Arg); |
| 314 | |
| Konstantin Zhuravlyov | f0badd5 | 2018-07-10 16:12:51 +0000 | [diff] [blame] | 315 | emitHiddenKernelArgs(Func); |
| Konstantin Zhuravlyov | 7498cd6 | 2017-03-22 22:32:22 +0000 | [diff] [blame] | 316 | } |
| 317 | |
| 318 | void MetadataStreamer::emitKernelArg(const Argument &Arg) { |
| 319 | auto Func = Arg.getParent(); |
| 320 | auto ArgNo = Arg.getArgNo(); |
| 321 | const MDNode *Node; |
| 322 | |
| Konstantin Zhuravlyov | a01d8b0 | 2017-10-14 19:03:51 +0000 | [diff] [blame] | 323 | StringRef Name; |
| 324 | Node = Func->getMetadata("kernel_arg_name"); |
| Konstantin Zhuravlyov | 7498cd6 | 2017-03-22 22:32:22 +0000 | [diff] [blame] | 325 | if (Node && ArgNo < Node->getNumOperands()) |
| Konstantin Zhuravlyov | a01d8b0 | 2017-10-14 19:03:51 +0000 | [diff] [blame] | 326 | Name = cast<MDString>(Node->getOperand(ArgNo))->getString(); |
| Konstantin Zhuravlyov | e30f88f | 2017-12-08 19:22:12 +0000 | [diff] [blame] | 327 | else if (Arg.hasName()) |
| 328 | Name = Arg.getName(); |
| Konstantin Zhuravlyov | a01d8b0 | 2017-10-14 19:03:51 +0000 | [diff] [blame] | 329 | |
| 330 | StringRef TypeName; |
| 331 | Node = Func->getMetadata("kernel_arg_type"); |
| 332 | if (Node && ArgNo < Node->getNumOperands()) |
| 333 | TypeName = cast<MDString>(Node->getOperand(ArgNo))->getString(); |
| Konstantin Zhuravlyov | 7498cd6 | 2017-03-22 22:32:22 +0000 | [diff] [blame] | 334 | |
| 335 | StringRef BaseTypeName; |
| 336 | Node = Func->getMetadata("kernel_arg_base_type"); |
| 337 | if (Node && ArgNo < Node->getNumOperands()) |
| 338 | BaseTypeName = cast<MDString>(Node->getOperand(ArgNo))->getString(); |
| 339 | |
| 340 | StringRef AccQual; |
| Stanislav Mekhanoshin | eff0bc7 | 2017-04-14 19:11:40 +0000 | [diff] [blame] | 341 | if (Arg.getType()->isPointerTy() && Arg.onlyReadsMemory() && |
| 342 | Arg.hasNoAliasAttr()) { |
| 343 | AccQual = "read_only"; |
| 344 | } else { |
| 345 | Node = Func->getMetadata("kernel_arg_access_qual"); |
| 346 | if (Node && ArgNo < Node->getNumOperands()) |
| 347 | AccQual = cast<MDString>(Node->getOperand(ArgNo))->getString(); |
| 348 | } |
| Konstantin Zhuravlyov | 7498cd6 | 2017-03-22 22:32:22 +0000 | [diff] [blame] | 349 | |
| Konstantin Zhuravlyov | a01d8b0 | 2017-10-14 19:03:51 +0000 | [diff] [blame] | 350 | StringRef TypeQual; |
| 351 | Node = Func->getMetadata("kernel_arg_type_qual"); |
| Konstantin Zhuravlyov | 7498cd6 | 2017-03-22 22:32:22 +0000 | [diff] [blame] | 352 | if (Node && ArgNo < Node->getNumOperands()) |
| Konstantin Zhuravlyov | a01d8b0 | 2017-10-14 19:03:51 +0000 | [diff] [blame] | 353 | TypeQual = cast<MDString>(Node->getOperand(ArgNo))->getString(); |
| Konstantin Zhuravlyov | 7498cd6 | 2017-03-22 22:32:22 +0000 | [diff] [blame] | 354 | |
| Matt Arsenault | 73eeb42 | 2018-06-25 14:29:04 +0000 | [diff] [blame] | 355 | Type *Ty = Arg.getType(); |
| 356 | const DataLayout &DL = Func->getParent()->getDataLayout(); |
| 357 | |
| 358 | unsigned PointeeAlign = 0; |
| 359 | if (auto PtrTy = dyn_cast<PointerType>(Ty)) { |
| Matt Arsenault | 0da6350 | 2018-08-31 05:49:54 +0000 | [diff] [blame] | 360 | if (PtrTy->getAddressSpace() == AMDGPUAS::LOCAL_ADDRESS) { |
| Matt Arsenault | 73eeb42 | 2018-06-25 14:29:04 +0000 | [diff] [blame] | 361 | PointeeAlign = Arg.getParamAlignment(); |
| 362 | if (PointeeAlign == 0) |
| 363 | PointeeAlign = DL.getABITypeAlignment(PtrTy->getElementType()); |
| 364 | } |
| 365 | } |
| 366 | |
| 367 | emitKernelArg(DL, Ty, getValueKind(Arg.getType(), TypeQual, BaseTypeName), |
| 368 | PointeeAlign, Name, TypeName, BaseTypeName, AccQual, TypeQual); |
| Konstantin Zhuravlyov | 7498cd6 | 2017-03-22 22:32:22 +0000 | [diff] [blame] | 369 | } |
| 370 | |
| 371 | void MetadataStreamer::emitKernelArg(const DataLayout &DL, Type *Ty, |
| Matt Arsenault | 73eeb42 | 2018-06-25 14:29:04 +0000 | [diff] [blame] | 372 | ValueKind ValueKind, |
| 373 | unsigned PointeeAlign, |
| 374 | StringRef Name, |
| Konstantin Zhuravlyov | a01d8b0 | 2017-10-14 19:03:51 +0000 | [diff] [blame] | 375 | StringRef TypeName, StringRef BaseTypeName, |
| 376 | StringRef AccQual, StringRef TypeQual) { |
| Konstantin Zhuravlyov | a63b0f9 | 2017-10-11 22:18:53 +0000 | [diff] [blame] | 377 | HSAMetadata.mKernels.back().mArgs.push_back(Kernel::Arg::Metadata()); |
| 378 | auto &Arg = HSAMetadata.mKernels.back().mArgs.back(); |
| Konstantin Zhuravlyov | 7498cd6 | 2017-03-22 22:32:22 +0000 | [diff] [blame] | 379 | |
| Konstantin Zhuravlyov | a01d8b0 | 2017-10-14 19:03:51 +0000 | [diff] [blame] | 380 | Arg.mName = Name; |
| 381 | Arg.mTypeName = TypeName; |
| Konstantin Zhuravlyov | 7498cd6 | 2017-03-22 22:32:22 +0000 | [diff] [blame] | 382 | Arg.mSize = DL.getTypeAllocSize(Ty); |
| 383 | Arg.mAlign = DL.getABITypeAlignment(Ty); |
| 384 | Arg.mValueKind = ValueKind; |
| 385 | Arg.mValueType = getValueType(Ty, BaseTypeName); |
| Matt Arsenault | 73eeb42 | 2018-06-25 14:29:04 +0000 | [diff] [blame] | 386 | Arg.mPointeeAlign = PointeeAlign; |
| Konstantin Zhuravlyov | 7498cd6 | 2017-03-22 22:32:22 +0000 | [diff] [blame] | 387 | |
| Konstantin Zhuravlyov | 7498cd6 | 2017-03-22 22:32:22 +0000 | [diff] [blame] | 388 | if (auto PtrTy = dyn_cast<PointerType>(Ty)) |
| 389 | Arg.mAddrSpaceQual = getAddressSpaceQualifer(PtrTy->getAddressSpace()); |
| 390 | |
| Konstantin Zhuravlyov | a01d8b0 | 2017-10-14 19:03:51 +0000 | [diff] [blame] | 391 | Arg.mAccQual = getAccessQualifier(AccQual); |
| 392 | |
| 393 | // TODO: Emit Arg.mActualAccQual. |
| 394 | |
| Konstantin Zhuravlyov | 7498cd6 | 2017-03-22 22:32:22 +0000 | [diff] [blame] | 395 | SmallVector<StringRef, 1> SplitTypeQuals; |
| 396 | TypeQual.split(SplitTypeQuals, " ", -1, false); |
| 397 | for (StringRef Key : SplitTypeQuals) { |
| 398 | auto P = StringSwitch<bool*>(Key) |
| 399 | .Case("const", &Arg.mIsConst) |
| Konstantin Zhuravlyov | 7498cd6 | 2017-03-22 22:32:22 +0000 | [diff] [blame] | 400 | .Case("restrict", &Arg.mIsRestrict) |
| 401 | .Case("volatile", &Arg.mIsVolatile) |
| Konstantin Zhuravlyov | a01d8b0 | 2017-10-14 19:03:51 +0000 | [diff] [blame] | 402 | .Case("pipe", &Arg.mIsPipe) |
| Konstantin Zhuravlyov | 7498cd6 | 2017-03-22 22:32:22 +0000 | [diff] [blame] | 403 | .Default(nullptr); |
| 404 | if (P) |
| 405 | *P = true; |
| 406 | } |
| Konstantin Zhuravlyov | a780ffa | 2017-03-22 23:10:46 +0000 | [diff] [blame] | 407 | } |
| 408 | |
| Konstantin Zhuravlyov | f0badd5 | 2018-07-10 16:12:51 +0000 | [diff] [blame] | 409 | void MetadataStreamer::emitHiddenKernelArgs(const Function &Func) { |
| 410 | int HiddenArgNumBytes = |
| 411 | getIntegerAttribute(Func, "amdgpu-implicitarg-num-bytes", 0); |
| 412 | |
| 413 | if (!HiddenArgNumBytes) |
| 414 | return; |
| 415 | |
| 416 | auto &DL = Func.getParent()->getDataLayout(); |
| 417 | auto Int64Ty = Type::getInt64Ty(Func.getContext()); |
| 418 | |
| 419 | if (HiddenArgNumBytes >= 8) |
| 420 | emitKernelArg(DL, Int64Ty, ValueKind::HiddenGlobalOffsetX); |
| 421 | if (HiddenArgNumBytes >= 16) |
| 422 | emitKernelArg(DL, Int64Ty, ValueKind::HiddenGlobalOffsetY); |
| 423 | if (HiddenArgNumBytes >= 24) |
| 424 | emitKernelArg(DL, Int64Ty, ValueKind::HiddenGlobalOffsetZ); |
| 425 | |
| 426 | auto Int8PtrTy = Type::getInt8PtrTy(Func.getContext(), |
| Matt Arsenault | 0da6350 | 2018-08-31 05:49:54 +0000 | [diff] [blame] | 427 | AMDGPUAS::GLOBAL_ADDRESS); |
| Konstantin Zhuravlyov | f0badd5 | 2018-07-10 16:12:51 +0000 | [diff] [blame] | 428 | |
| 429 | // Emit "printf buffer" argument if printf is used, otherwise emit dummy |
| 430 | // "none" argument. |
| 431 | if (HiddenArgNumBytes >= 32) { |
| 432 | if (Func.getParent()->getNamedMetadata("llvm.printf.fmts")) |
| 433 | emitKernelArg(DL, Int8PtrTy, ValueKind::HiddenPrintfBuffer); |
| 434 | else |
| 435 | emitKernelArg(DL, Int8PtrTy, ValueKind::HiddenNone); |
| 436 | } |
| 437 | |
| 438 | // Emit "default queue" and "completion action" arguments if enqueue kernel is |
| 439 | // used, otherwise emit dummy "none" arguments. |
| 440 | if (HiddenArgNumBytes >= 48) { |
| 441 | if (Func.hasFnAttribute("calls-enqueue-kernel")) { |
| 442 | emitKernelArg(DL, Int8PtrTy, ValueKind::HiddenDefaultQueue); |
| 443 | emitKernelArg(DL, Int8PtrTy, ValueKind::HiddenCompletionAction); |
| 444 | } else { |
| 445 | emitKernelArg(DL, Int8PtrTy, ValueKind::HiddenNone); |
| 446 | emitKernelArg(DL, Int8PtrTy, ValueKind::HiddenNone); |
| 447 | } |
| 448 | } |
| 449 | } |
| 450 | |
| Konstantin Zhuravlyov | 4cbb689 | 2017-03-22 23:27:09 +0000 | [diff] [blame] | 451 | void MetadataStreamer::begin(const Module &Mod) { |
| Konstantin Zhuravlyov | 7498cd6 | 2017-03-22 22:32:22 +0000 | [diff] [blame] | 452 | emitVersion(); |
| Konstantin Zhuravlyov | 7498cd6 | 2017-03-22 22:32:22 +0000 | [diff] [blame] | 453 | emitPrintf(Mod); |
| 454 | } |
| 455 | |
| Konstantin Zhuravlyov | 516651b | 2017-10-11 22:59:35 +0000 | [diff] [blame] | 456 | void MetadataStreamer::end() { |
| 457 | std::string HSAMetadataString; |
| Konstantin Zhuravlyov | 63e87f5 | 2017-10-12 17:34:05 +0000 | [diff] [blame] | 458 | if (toString(HSAMetadata, HSAMetadataString)) |
| Konstantin Zhuravlyov | 516651b | 2017-10-11 22:59:35 +0000 | [diff] [blame] | 459 | return; |
| 460 | |
| 461 | if (DumpHSAMetadata) |
| 462 | dump(HSAMetadataString); |
| 463 | if (VerifyHSAMetadata) |
| 464 | verify(HSAMetadataString); |
| 465 | } |
| 466 | |
| Scott Linder | 2ad2c18 | 2018-07-10 17:31:32 +0000 | [diff] [blame] | 467 | void MetadataStreamer::emitKernel(const MachineFunction &MF, const SIProgramInfo &ProgramInfo) { |
| 468 | auto &Func = MF.getFunction(); |
| Konstantin Zhuravlyov | 7498cd6 | 2017-03-22 22:32:22 +0000 | [diff] [blame] | 469 | if (Func.getCallingConv() != CallingConv::AMDGPU_KERNEL) |
| 470 | return; |
| 471 | |
| Matt Arsenault | 4bec7d4 | 2018-07-20 09:05:08 +0000 | [diff] [blame] | 472 | auto CodeProps = getHSACodeProps(MF, ProgramInfo); |
| 473 | auto DebugProps = getHSADebugProps(MF, ProgramInfo); |
| 474 | |
| Konstantin Zhuravlyov | a63b0f9 | 2017-10-11 22:18:53 +0000 | [diff] [blame] | 475 | HSAMetadata.mKernels.push_back(Kernel::Metadata()); |
| 476 | auto &Kernel = HSAMetadata.mKernels.back(); |
| Konstantin Zhuravlyov | 7498cd6 | 2017-03-22 22:32:22 +0000 | [diff] [blame] | 477 | |
| 478 | Kernel.mName = Func.getName(); |
| Konstantin Zhuravlyov | a01d8b0 | 2017-10-14 19:03:51 +0000 | [diff] [blame] | 479 | Kernel.mSymbolName = (Twine(Func.getName()) + Twine("@kd")).str(); |
| Konstantin Zhuravlyov | 7498cd6 | 2017-03-22 22:32:22 +0000 | [diff] [blame] | 480 | emitKernelLanguage(Func); |
| 481 | emitKernelAttrs(Func); |
| 482 | emitKernelArgs(Func); |
| Konstantin Zhuravlyov | a01d8b0 | 2017-10-14 19:03:51 +0000 | [diff] [blame] | 483 | HSAMetadata.mKernels.back().mCodeProps = CodeProps; |
| 484 | HSAMetadata.mKernels.back().mDebugProps = DebugProps; |
| Konstantin Zhuravlyov | 7498cd6 | 2017-03-22 22:32:22 +0000 | [diff] [blame] | 485 | } |
| 486 | |
| Konstantin Zhuravlyov | a63b0f9 | 2017-10-11 22:18:53 +0000 | [diff] [blame] | 487 | } // end namespace HSAMD |
| Konstantin Zhuravlyov | 7498cd6 | 2017-03-22 22:32:22 +0000 | [diff] [blame] | 488 | } // end namespace AMDGPU |
| 489 | } // end namespace llvm |