xref: /freebsd/contrib/llvm-project/llvm/lib/Target/AMDGPU/AMDGPUHSAMetadataStreamer.cpp (revision 5ffd83dbcc34f10e07f6d3e968ae6365869615f4)
10b57cec5SDimitry Andric //===--- AMDGPUHSAMetadataStreamer.cpp --------------------------*- C++ -*-===//
20b57cec5SDimitry Andric //
30b57cec5SDimitry Andric // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
40b57cec5SDimitry Andric // See https://llvm.org/LICENSE.txt for license information.
50b57cec5SDimitry Andric // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
60b57cec5SDimitry Andric //
70b57cec5SDimitry Andric //===----------------------------------------------------------------------===//
80b57cec5SDimitry Andric //
90b57cec5SDimitry Andric /// \file
100b57cec5SDimitry Andric /// AMDGPU HSA Metadata Streamer.
110b57cec5SDimitry Andric ///
120b57cec5SDimitry Andric //
130b57cec5SDimitry Andric //===----------------------------------------------------------------------===//
140b57cec5SDimitry Andric 
150b57cec5SDimitry Andric #include "AMDGPUHSAMetadataStreamer.h"
160b57cec5SDimitry Andric #include "AMDGPU.h"
170b57cec5SDimitry Andric #include "AMDGPUSubtarget.h"
180b57cec5SDimitry Andric #include "MCTargetDesc/AMDGPUTargetStreamer.h"
190b57cec5SDimitry Andric #include "SIMachineFunctionInfo.h"
200b57cec5SDimitry Andric #include "SIProgramInfo.h"
210b57cec5SDimitry Andric #include "Utils/AMDGPUBaseInfo.h"
220b57cec5SDimitry Andric #include "llvm/ADT/StringSwitch.h"
230b57cec5SDimitry Andric #include "llvm/IR/Constants.h"
240b57cec5SDimitry Andric #include "llvm/IR/Module.h"
250b57cec5SDimitry Andric #include "llvm/Support/raw_ostream.h"
260b57cec5SDimitry Andric 
270b57cec5SDimitry Andric namespace llvm {
280b57cec5SDimitry Andric 
290b57cec5SDimitry Andric static cl::opt<bool> DumpHSAMetadata(
300b57cec5SDimitry Andric     "amdgpu-dump-hsa-metadata",
310b57cec5SDimitry Andric     cl::desc("Dump AMDGPU HSA Metadata"));
320b57cec5SDimitry Andric static cl::opt<bool> VerifyHSAMetadata(
330b57cec5SDimitry Andric     "amdgpu-verify-hsa-metadata",
340b57cec5SDimitry Andric     cl::desc("Verify AMDGPU HSA Metadata"));
350b57cec5SDimitry Andric 
360b57cec5SDimitry Andric namespace AMDGPU {
370b57cec5SDimitry Andric namespace HSAMD {
380b57cec5SDimitry Andric 
390b57cec5SDimitry Andric //===----------------------------------------------------------------------===//
400b57cec5SDimitry Andric // HSAMetadataStreamerV2
410b57cec5SDimitry Andric //===----------------------------------------------------------------------===//
420b57cec5SDimitry Andric void MetadataStreamerV2::dump(StringRef HSAMetadataString) const {
430b57cec5SDimitry Andric   errs() << "AMDGPU HSA Metadata:\n" << HSAMetadataString << '\n';
440b57cec5SDimitry Andric }
450b57cec5SDimitry Andric 
460b57cec5SDimitry Andric void MetadataStreamerV2::verify(StringRef HSAMetadataString) const {
470b57cec5SDimitry Andric   errs() << "AMDGPU HSA Metadata Parser Test: ";
480b57cec5SDimitry Andric 
490b57cec5SDimitry Andric   HSAMD::Metadata FromHSAMetadataString;
50*5ffd83dbSDimitry Andric   if (fromString(std::string(HSAMetadataString), FromHSAMetadataString)) {
510b57cec5SDimitry Andric     errs() << "FAIL\n";
520b57cec5SDimitry Andric     return;
530b57cec5SDimitry Andric   }
540b57cec5SDimitry Andric 
550b57cec5SDimitry Andric   std::string ToHSAMetadataString;
560b57cec5SDimitry Andric   if (toString(FromHSAMetadataString, ToHSAMetadataString)) {
570b57cec5SDimitry Andric     errs() << "FAIL\n";
580b57cec5SDimitry Andric     return;
590b57cec5SDimitry Andric   }
600b57cec5SDimitry Andric 
610b57cec5SDimitry Andric   errs() << (HSAMetadataString == ToHSAMetadataString ? "PASS" : "FAIL")
620b57cec5SDimitry Andric          << '\n';
630b57cec5SDimitry Andric   if (HSAMetadataString != ToHSAMetadataString) {
640b57cec5SDimitry Andric     errs() << "Original input: " << HSAMetadataString << '\n'
650b57cec5SDimitry Andric            << "Produced output: " << ToHSAMetadataString << '\n';
660b57cec5SDimitry Andric   }
670b57cec5SDimitry Andric }
680b57cec5SDimitry Andric 
690b57cec5SDimitry Andric AccessQualifier
700b57cec5SDimitry Andric MetadataStreamerV2::getAccessQualifier(StringRef AccQual) const {
710b57cec5SDimitry Andric   if (AccQual.empty())
720b57cec5SDimitry Andric     return AccessQualifier::Unknown;
730b57cec5SDimitry Andric 
740b57cec5SDimitry Andric   return StringSwitch<AccessQualifier>(AccQual)
750b57cec5SDimitry Andric              .Case("read_only",  AccessQualifier::ReadOnly)
760b57cec5SDimitry Andric              .Case("write_only", AccessQualifier::WriteOnly)
770b57cec5SDimitry Andric              .Case("read_write", AccessQualifier::ReadWrite)
780b57cec5SDimitry Andric              .Default(AccessQualifier::Default);
790b57cec5SDimitry Andric }
800b57cec5SDimitry Andric 
810b57cec5SDimitry Andric AddressSpaceQualifier
820b57cec5SDimitry Andric MetadataStreamerV2::getAddressSpaceQualifier(
830b57cec5SDimitry Andric     unsigned AddressSpace) const {
840b57cec5SDimitry Andric   switch (AddressSpace) {
850b57cec5SDimitry Andric   case AMDGPUAS::PRIVATE_ADDRESS:
860b57cec5SDimitry Andric     return AddressSpaceQualifier::Private;
870b57cec5SDimitry Andric   case AMDGPUAS::GLOBAL_ADDRESS:
880b57cec5SDimitry Andric     return AddressSpaceQualifier::Global;
890b57cec5SDimitry Andric   case AMDGPUAS::CONSTANT_ADDRESS:
900b57cec5SDimitry Andric     return AddressSpaceQualifier::Constant;
910b57cec5SDimitry Andric   case AMDGPUAS::LOCAL_ADDRESS:
920b57cec5SDimitry Andric     return AddressSpaceQualifier::Local;
930b57cec5SDimitry Andric   case AMDGPUAS::FLAT_ADDRESS:
940b57cec5SDimitry Andric     return AddressSpaceQualifier::Generic;
950b57cec5SDimitry Andric   case AMDGPUAS::REGION_ADDRESS:
960b57cec5SDimitry Andric     return AddressSpaceQualifier::Region;
970b57cec5SDimitry Andric   default:
980b57cec5SDimitry Andric     return AddressSpaceQualifier::Unknown;
990b57cec5SDimitry Andric   }
1000b57cec5SDimitry Andric }
1010b57cec5SDimitry Andric 
1020b57cec5SDimitry Andric ValueKind MetadataStreamerV2::getValueKind(Type *Ty, StringRef TypeQual,
1030b57cec5SDimitry Andric                                            StringRef BaseTypeName) const {
1040b57cec5SDimitry Andric   if (TypeQual.find("pipe") != StringRef::npos)
1050b57cec5SDimitry Andric     return ValueKind::Pipe;
1060b57cec5SDimitry Andric 
1070b57cec5SDimitry Andric   return StringSwitch<ValueKind>(BaseTypeName)
1080b57cec5SDimitry Andric              .Case("image1d_t", ValueKind::Image)
1090b57cec5SDimitry Andric              .Case("image1d_array_t", ValueKind::Image)
1100b57cec5SDimitry Andric              .Case("image1d_buffer_t", ValueKind::Image)
1110b57cec5SDimitry Andric              .Case("image2d_t", ValueKind::Image)
1120b57cec5SDimitry Andric              .Case("image2d_array_t", ValueKind::Image)
1130b57cec5SDimitry Andric              .Case("image2d_array_depth_t", ValueKind::Image)
1140b57cec5SDimitry Andric              .Case("image2d_array_msaa_t", ValueKind::Image)
1150b57cec5SDimitry Andric              .Case("image2d_array_msaa_depth_t", ValueKind::Image)
1160b57cec5SDimitry Andric              .Case("image2d_depth_t", ValueKind::Image)
1170b57cec5SDimitry Andric              .Case("image2d_msaa_t", ValueKind::Image)
1180b57cec5SDimitry Andric              .Case("image2d_msaa_depth_t", ValueKind::Image)
1190b57cec5SDimitry Andric              .Case("image3d_t", ValueKind::Image)
1200b57cec5SDimitry Andric              .Case("sampler_t", ValueKind::Sampler)
1210b57cec5SDimitry Andric              .Case("queue_t", ValueKind::Queue)
1220b57cec5SDimitry Andric              .Default(isa<PointerType>(Ty) ?
1230b57cec5SDimitry Andric                           (Ty->getPointerAddressSpace() ==
1240b57cec5SDimitry Andric                            AMDGPUAS::LOCAL_ADDRESS ?
1250b57cec5SDimitry Andric                            ValueKind::DynamicSharedPointer :
1260b57cec5SDimitry Andric                            ValueKind::GlobalBuffer) :
1270b57cec5SDimitry Andric                       ValueKind::ByValue);
1280b57cec5SDimitry Andric }
1290b57cec5SDimitry Andric 
1300b57cec5SDimitry Andric std::string MetadataStreamerV2::getTypeName(Type *Ty, bool Signed) const {
1310b57cec5SDimitry Andric   switch (Ty->getTypeID()) {
1320b57cec5SDimitry Andric   case Type::IntegerTyID: {
1330b57cec5SDimitry Andric     if (!Signed)
1340b57cec5SDimitry Andric       return (Twine('u') + getTypeName(Ty, true)).str();
1350b57cec5SDimitry Andric 
1360b57cec5SDimitry Andric     auto BitWidth = Ty->getIntegerBitWidth();
1370b57cec5SDimitry Andric     switch (BitWidth) {
1380b57cec5SDimitry Andric     case 8:
1390b57cec5SDimitry Andric       return "char";
1400b57cec5SDimitry Andric     case 16:
1410b57cec5SDimitry Andric       return "short";
1420b57cec5SDimitry Andric     case 32:
1430b57cec5SDimitry Andric       return "int";
1440b57cec5SDimitry Andric     case 64:
1450b57cec5SDimitry Andric       return "long";
1460b57cec5SDimitry Andric     default:
1470b57cec5SDimitry Andric       return (Twine('i') + Twine(BitWidth)).str();
1480b57cec5SDimitry Andric     }
1490b57cec5SDimitry Andric   }
1500b57cec5SDimitry Andric   case Type::HalfTyID:
1510b57cec5SDimitry Andric     return "half";
1520b57cec5SDimitry Andric   case Type::FloatTyID:
1530b57cec5SDimitry Andric     return "float";
1540b57cec5SDimitry Andric   case Type::DoubleTyID:
1550b57cec5SDimitry Andric     return "double";
156*5ffd83dbSDimitry Andric   case Type::FixedVectorTyID: {
157*5ffd83dbSDimitry Andric     auto VecTy = cast<FixedVectorType>(Ty);
1580b57cec5SDimitry Andric     auto ElTy = VecTy->getElementType();
159*5ffd83dbSDimitry Andric     auto NumElements = VecTy->getNumElements();
1600b57cec5SDimitry Andric     return (Twine(getTypeName(ElTy, Signed)) + Twine(NumElements)).str();
1610b57cec5SDimitry Andric   }
1620b57cec5SDimitry Andric   default:
1630b57cec5SDimitry Andric     return "unknown";
1640b57cec5SDimitry Andric   }
1650b57cec5SDimitry Andric }
1660b57cec5SDimitry Andric 
1670b57cec5SDimitry Andric std::vector<uint32_t>
1680b57cec5SDimitry Andric MetadataStreamerV2::getWorkGroupDimensions(MDNode *Node) const {
1690b57cec5SDimitry Andric   std::vector<uint32_t> Dims;
1700b57cec5SDimitry Andric   if (Node->getNumOperands() != 3)
1710b57cec5SDimitry Andric     return Dims;
1720b57cec5SDimitry Andric 
1730b57cec5SDimitry Andric   for (auto &Op : Node->operands())
1740b57cec5SDimitry Andric     Dims.push_back(mdconst::extract<ConstantInt>(Op)->getZExtValue());
1750b57cec5SDimitry Andric   return Dims;
1760b57cec5SDimitry Andric }
1770b57cec5SDimitry Andric 
1780b57cec5SDimitry Andric Kernel::CodeProps::Metadata
1790b57cec5SDimitry Andric MetadataStreamerV2::getHSACodeProps(const MachineFunction &MF,
1800b57cec5SDimitry Andric                                     const SIProgramInfo &ProgramInfo) const {
1810b57cec5SDimitry Andric   const GCNSubtarget &STM = MF.getSubtarget<GCNSubtarget>();
1820b57cec5SDimitry Andric   const SIMachineFunctionInfo &MFI = *MF.getInfo<SIMachineFunctionInfo>();
1830b57cec5SDimitry Andric   HSAMD::Kernel::CodeProps::Metadata HSACodeProps;
1840b57cec5SDimitry Andric   const Function &F = MF.getFunction();
1850b57cec5SDimitry Andric 
1860b57cec5SDimitry Andric   assert(F.getCallingConv() == CallingConv::AMDGPU_KERNEL ||
1870b57cec5SDimitry Andric          F.getCallingConv() == CallingConv::SPIR_KERNEL);
1880b57cec5SDimitry Andric 
1898bcb0991SDimitry Andric   Align MaxKernArgAlign;
1900b57cec5SDimitry Andric   HSACodeProps.mKernargSegmentSize = STM.getKernArgSegmentSize(F,
1910b57cec5SDimitry Andric                                                                MaxKernArgAlign);
1920b57cec5SDimitry Andric   HSACodeProps.mGroupSegmentFixedSize = ProgramInfo.LDSSize;
1930b57cec5SDimitry Andric   HSACodeProps.mPrivateSegmentFixedSize = ProgramInfo.ScratchSize;
1948bcb0991SDimitry Andric   HSACodeProps.mKernargSegmentAlign =
1958bcb0991SDimitry Andric       std::max(MaxKernArgAlign, Align(4)).value();
1960b57cec5SDimitry Andric   HSACodeProps.mWavefrontSize = STM.getWavefrontSize();
1970b57cec5SDimitry Andric   HSACodeProps.mNumSGPRs = ProgramInfo.NumSGPR;
1980b57cec5SDimitry Andric   HSACodeProps.mNumVGPRs = ProgramInfo.NumVGPR;
1990b57cec5SDimitry Andric   HSACodeProps.mMaxFlatWorkGroupSize = MFI.getMaxFlatWorkGroupSize();
2000b57cec5SDimitry Andric   HSACodeProps.mIsDynamicCallStack = ProgramInfo.DynamicCallStack;
2010b57cec5SDimitry Andric   HSACodeProps.mIsXNACKEnabled = STM.isXNACKEnabled();
2020b57cec5SDimitry Andric   HSACodeProps.mNumSpilledSGPRs = MFI.getNumSpilledSGPRs();
2030b57cec5SDimitry Andric   HSACodeProps.mNumSpilledVGPRs = MFI.getNumSpilledVGPRs();
2040b57cec5SDimitry Andric 
2050b57cec5SDimitry Andric   return HSACodeProps;
2060b57cec5SDimitry Andric }
2070b57cec5SDimitry Andric 
2080b57cec5SDimitry Andric Kernel::DebugProps::Metadata
2090b57cec5SDimitry Andric MetadataStreamerV2::getHSADebugProps(const MachineFunction &MF,
2100b57cec5SDimitry Andric                                      const SIProgramInfo &ProgramInfo) const {
2110b57cec5SDimitry Andric   return HSAMD::Kernel::DebugProps::Metadata();
2120b57cec5SDimitry Andric }
2130b57cec5SDimitry Andric 
2140b57cec5SDimitry Andric void MetadataStreamerV2::emitVersion() {
2150b57cec5SDimitry Andric   auto &Version = HSAMetadata.mVersion;
2160b57cec5SDimitry Andric 
2170b57cec5SDimitry Andric   Version.push_back(VersionMajor);
2180b57cec5SDimitry Andric   Version.push_back(VersionMinor);
2190b57cec5SDimitry Andric }
2200b57cec5SDimitry Andric 
2210b57cec5SDimitry Andric void MetadataStreamerV2::emitPrintf(const Module &Mod) {
2220b57cec5SDimitry Andric   auto &Printf = HSAMetadata.mPrintf;
2230b57cec5SDimitry Andric 
2240b57cec5SDimitry Andric   auto Node = Mod.getNamedMetadata("llvm.printf.fmts");
2250b57cec5SDimitry Andric   if (!Node)
2260b57cec5SDimitry Andric     return;
2270b57cec5SDimitry Andric 
2280b57cec5SDimitry Andric   for (auto Op : Node->operands())
2290b57cec5SDimitry Andric     if (Op->getNumOperands())
230*5ffd83dbSDimitry Andric       Printf.push_back(
231*5ffd83dbSDimitry Andric           std::string(cast<MDString>(Op->getOperand(0))->getString()));
2320b57cec5SDimitry Andric }
2330b57cec5SDimitry Andric 
2340b57cec5SDimitry Andric void MetadataStreamerV2::emitKernelLanguage(const Function &Func) {
2350b57cec5SDimitry Andric   auto &Kernel = HSAMetadata.mKernels.back();
2360b57cec5SDimitry Andric 
2370b57cec5SDimitry Andric   // TODO: What about other languages?
2380b57cec5SDimitry Andric   auto Node = Func.getParent()->getNamedMetadata("opencl.ocl.version");
2390b57cec5SDimitry Andric   if (!Node || !Node->getNumOperands())
2400b57cec5SDimitry Andric     return;
2410b57cec5SDimitry Andric   auto Op0 = Node->getOperand(0);
2420b57cec5SDimitry Andric   if (Op0->getNumOperands() <= 1)
2430b57cec5SDimitry Andric     return;
2440b57cec5SDimitry Andric 
2450b57cec5SDimitry Andric   Kernel.mLanguage = "OpenCL C";
2460b57cec5SDimitry Andric   Kernel.mLanguageVersion.push_back(
2470b57cec5SDimitry Andric       mdconst::extract<ConstantInt>(Op0->getOperand(0))->getZExtValue());
2480b57cec5SDimitry Andric   Kernel.mLanguageVersion.push_back(
2490b57cec5SDimitry Andric       mdconst::extract<ConstantInt>(Op0->getOperand(1))->getZExtValue());
2500b57cec5SDimitry Andric }
2510b57cec5SDimitry Andric 
2520b57cec5SDimitry Andric void MetadataStreamerV2::emitKernelAttrs(const Function &Func) {
2530b57cec5SDimitry Andric   auto &Attrs = HSAMetadata.mKernels.back().mAttrs;
2540b57cec5SDimitry Andric 
2550b57cec5SDimitry Andric   if (auto Node = Func.getMetadata("reqd_work_group_size"))
2560b57cec5SDimitry Andric     Attrs.mReqdWorkGroupSize = getWorkGroupDimensions(Node);
2570b57cec5SDimitry Andric   if (auto Node = Func.getMetadata("work_group_size_hint"))
2580b57cec5SDimitry Andric     Attrs.mWorkGroupSizeHint = getWorkGroupDimensions(Node);
2590b57cec5SDimitry Andric   if (auto Node = Func.getMetadata("vec_type_hint")) {
2600b57cec5SDimitry Andric     Attrs.mVecTypeHint = getTypeName(
2610b57cec5SDimitry Andric         cast<ValueAsMetadata>(Node->getOperand(0))->getType(),
2620b57cec5SDimitry Andric         mdconst::extract<ConstantInt>(Node->getOperand(1))->getZExtValue());
2630b57cec5SDimitry Andric   }
2640b57cec5SDimitry Andric   if (Func.hasFnAttribute("runtime-handle")) {
2650b57cec5SDimitry Andric     Attrs.mRuntimeHandle =
2660b57cec5SDimitry Andric         Func.getFnAttribute("runtime-handle").getValueAsString().str();
2670b57cec5SDimitry Andric   }
2680b57cec5SDimitry Andric }
2690b57cec5SDimitry Andric 
2700b57cec5SDimitry Andric void MetadataStreamerV2::emitKernelArgs(const Function &Func) {
2710b57cec5SDimitry Andric   for (auto &Arg : Func.args())
2720b57cec5SDimitry Andric     emitKernelArg(Arg);
2730b57cec5SDimitry Andric 
2740b57cec5SDimitry Andric   emitHiddenKernelArgs(Func);
2750b57cec5SDimitry Andric }
2760b57cec5SDimitry Andric 
2770b57cec5SDimitry Andric void MetadataStreamerV2::emitKernelArg(const Argument &Arg) {
2780b57cec5SDimitry Andric   auto Func = Arg.getParent();
2790b57cec5SDimitry Andric   auto ArgNo = Arg.getArgNo();
2800b57cec5SDimitry Andric   const MDNode *Node;
2810b57cec5SDimitry Andric 
2820b57cec5SDimitry Andric   StringRef Name;
2830b57cec5SDimitry Andric   Node = Func->getMetadata("kernel_arg_name");
2840b57cec5SDimitry Andric   if (Node && ArgNo < Node->getNumOperands())
2850b57cec5SDimitry Andric     Name = cast<MDString>(Node->getOperand(ArgNo))->getString();
2860b57cec5SDimitry Andric   else if (Arg.hasName())
2870b57cec5SDimitry Andric     Name = Arg.getName();
2880b57cec5SDimitry Andric 
2890b57cec5SDimitry Andric   StringRef TypeName;
2900b57cec5SDimitry Andric   Node = Func->getMetadata("kernel_arg_type");
2910b57cec5SDimitry Andric   if (Node && ArgNo < Node->getNumOperands())
2920b57cec5SDimitry Andric     TypeName = cast<MDString>(Node->getOperand(ArgNo))->getString();
2930b57cec5SDimitry Andric 
2940b57cec5SDimitry Andric   StringRef BaseTypeName;
2950b57cec5SDimitry Andric   Node = Func->getMetadata("kernel_arg_base_type");
2960b57cec5SDimitry Andric   if (Node && ArgNo < Node->getNumOperands())
2970b57cec5SDimitry Andric     BaseTypeName = cast<MDString>(Node->getOperand(ArgNo))->getString();
2980b57cec5SDimitry Andric 
2990b57cec5SDimitry Andric   StringRef AccQual;
3000b57cec5SDimitry Andric   if (Arg.getType()->isPointerTy() && Arg.onlyReadsMemory() &&
3010b57cec5SDimitry Andric       Arg.hasNoAliasAttr()) {
3020b57cec5SDimitry Andric     AccQual = "read_only";
3030b57cec5SDimitry Andric   } else {
3040b57cec5SDimitry Andric     Node = Func->getMetadata("kernel_arg_access_qual");
3050b57cec5SDimitry Andric     if (Node && ArgNo < Node->getNumOperands())
3060b57cec5SDimitry Andric       AccQual = cast<MDString>(Node->getOperand(ArgNo))->getString();
3070b57cec5SDimitry Andric   }
3080b57cec5SDimitry Andric 
3090b57cec5SDimitry Andric   StringRef TypeQual;
3100b57cec5SDimitry Andric   Node = Func->getMetadata("kernel_arg_type_qual");
3110b57cec5SDimitry Andric   if (Node && ArgNo < Node->getNumOperands())
3120b57cec5SDimitry Andric     TypeQual = cast<MDString>(Node->getOperand(ArgNo))->getString();
3130b57cec5SDimitry Andric 
3140b57cec5SDimitry Andric   Type *Ty = Arg.getType();
3150b57cec5SDimitry Andric   const DataLayout &DL = Func->getParent()->getDataLayout();
3160b57cec5SDimitry Andric 
317*5ffd83dbSDimitry Andric   MaybeAlign PointeeAlign;
3180b57cec5SDimitry Andric   if (auto PtrTy = dyn_cast<PointerType>(Ty)) {
3190b57cec5SDimitry Andric     if (PtrTy->getAddressSpace() == AMDGPUAS::LOCAL_ADDRESS) {
320*5ffd83dbSDimitry Andric       PointeeAlign = DL.getValueOrABITypeAlignment(Arg.getParamAlign(),
321*5ffd83dbSDimitry Andric                                                    PtrTy->getElementType());
3220b57cec5SDimitry Andric     }
3230b57cec5SDimitry Andric   }
3240b57cec5SDimitry Andric 
3250b57cec5SDimitry Andric   emitKernelArg(DL, Ty, getValueKind(Arg.getType(), TypeQual, BaseTypeName),
3260b57cec5SDimitry Andric                 PointeeAlign, Name, TypeName, BaseTypeName, AccQual, TypeQual);
3270b57cec5SDimitry Andric }
3280b57cec5SDimitry Andric 
3290b57cec5SDimitry Andric void MetadataStreamerV2::emitKernelArg(const DataLayout &DL, Type *Ty,
3300b57cec5SDimitry Andric                                        ValueKind ValueKind,
331*5ffd83dbSDimitry Andric                                        MaybeAlign PointeeAlign, StringRef Name,
3320b57cec5SDimitry Andric                                        StringRef TypeName,
3330b57cec5SDimitry Andric                                        StringRef BaseTypeName,
3340b57cec5SDimitry Andric                                        StringRef AccQual, StringRef TypeQual) {
3350b57cec5SDimitry Andric   HSAMetadata.mKernels.back().mArgs.push_back(Kernel::Arg::Metadata());
3360b57cec5SDimitry Andric   auto &Arg = HSAMetadata.mKernels.back().mArgs.back();
3370b57cec5SDimitry Andric 
338*5ffd83dbSDimitry Andric   Arg.mName = std::string(Name);
339*5ffd83dbSDimitry Andric   Arg.mTypeName = std::string(TypeName);
3400b57cec5SDimitry Andric   Arg.mSize = DL.getTypeAllocSize(Ty);
341*5ffd83dbSDimitry Andric   Arg.mAlign = DL.getABITypeAlign(Ty).value();
3420b57cec5SDimitry Andric   Arg.mValueKind = ValueKind;
343*5ffd83dbSDimitry Andric   Arg.mPointeeAlign = PointeeAlign ? PointeeAlign->value() : 0;
3440b57cec5SDimitry Andric 
3450b57cec5SDimitry Andric   if (auto PtrTy = dyn_cast<PointerType>(Ty))
3460b57cec5SDimitry Andric     Arg.mAddrSpaceQual = getAddressSpaceQualifier(PtrTy->getAddressSpace());
3470b57cec5SDimitry Andric 
3480b57cec5SDimitry Andric   Arg.mAccQual = getAccessQualifier(AccQual);
3490b57cec5SDimitry Andric 
3500b57cec5SDimitry Andric   // TODO: Emit Arg.mActualAccQual.
3510b57cec5SDimitry Andric 
3520b57cec5SDimitry Andric   SmallVector<StringRef, 1> SplitTypeQuals;
3530b57cec5SDimitry Andric   TypeQual.split(SplitTypeQuals, " ", -1, false);
3540b57cec5SDimitry Andric   for (StringRef Key : SplitTypeQuals) {
3550b57cec5SDimitry Andric     auto P = StringSwitch<bool*>(Key)
3560b57cec5SDimitry Andric                  .Case("const",    &Arg.mIsConst)
3570b57cec5SDimitry Andric                  .Case("restrict", &Arg.mIsRestrict)
3580b57cec5SDimitry Andric                  .Case("volatile", &Arg.mIsVolatile)
3590b57cec5SDimitry Andric                  .Case("pipe",     &Arg.mIsPipe)
3600b57cec5SDimitry Andric                  .Default(nullptr);
3610b57cec5SDimitry Andric     if (P)
3620b57cec5SDimitry Andric       *P = true;
3630b57cec5SDimitry Andric   }
3640b57cec5SDimitry Andric }
3650b57cec5SDimitry Andric 
3660b57cec5SDimitry Andric void MetadataStreamerV2::emitHiddenKernelArgs(const Function &Func) {
3670b57cec5SDimitry Andric   int HiddenArgNumBytes =
3680b57cec5SDimitry Andric       getIntegerAttribute(Func, "amdgpu-implicitarg-num-bytes", 0);
3690b57cec5SDimitry Andric 
3700b57cec5SDimitry Andric   if (!HiddenArgNumBytes)
3710b57cec5SDimitry Andric     return;
3720b57cec5SDimitry Andric 
3730b57cec5SDimitry Andric   auto &DL = Func.getParent()->getDataLayout();
3740b57cec5SDimitry Andric   auto Int64Ty = Type::getInt64Ty(Func.getContext());
3750b57cec5SDimitry Andric 
3760b57cec5SDimitry Andric   if (HiddenArgNumBytes >= 8)
3770b57cec5SDimitry Andric     emitKernelArg(DL, Int64Ty, ValueKind::HiddenGlobalOffsetX);
3780b57cec5SDimitry Andric   if (HiddenArgNumBytes >= 16)
3790b57cec5SDimitry Andric     emitKernelArg(DL, Int64Ty, ValueKind::HiddenGlobalOffsetY);
3800b57cec5SDimitry Andric   if (HiddenArgNumBytes >= 24)
3810b57cec5SDimitry Andric     emitKernelArg(DL, Int64Ty, ValueKind::HiddenGlobalOffsetZ);
3820b57cec5SDimitry Andric 
3830b57cec5SDimitry Andric   auto Int8PtrTy = Type::getInt8PtrTy(Func.getContext(),
3840b57cec5SDimitry Andric                                       AMDGPUAS::GLOBAL_ADDRESS);
3850b57cec5SDimitry Andric 
3860b57cec5SDimitry Andric   // Emit "printf buffer" argument if printf is used, otherwise emit dummy
3870b57cec5SDimitry Andric   // "none" argument.
3880b57cec5SDimitry Andric   if (HiddenArgNumBytes >= 32) {
3890b57cec5SDimitry Andric     if (Func.getParent()->getNamedMetadata("llvm.printf.fmts"))
3900b57cec5SDimitry Andric       emitKernelArg(DL, Int8PtrTy, ValueKind::HiddenPrintfBuffer);
391480093f4SDimitry Andric     else if (Func.getParent()->getFunction("__ockl_hostcall_internal")) {
392480093f4SDimitry Andric       // The printf runtime binding pass should have ensured that hostcall and
393480093f4SDimitry Andric       // printf are not used in the same module.
394480093f4SDimitry Andric       assert(!Func.getParent()->getNamedMetadata("llvm.printf.fmts"));
395480093f4SDimitry Andric       emitKernelArg(DL, Int8PtrTy, ValueKind::HiddenHostcallBuffer);
396480093f4SDimitry Andric     } else
3970b57cec5SDimitry Andric       emitKernelArg(DL, Int8PtrTy, ValueKind::HiddenNone);
3980b57cec5SDimitry Andric   }
3990b57cec5SDimitry Andric 
4000b57cec5SDimitry Andric   // Emit "default queue" and "completion action" arguments if enqueue kernel is
4010b57cec5SDimitry Andric   // used, otherwise emit dummy "none" arguments.
4020b57cec5SDimitry Andric   if (HiddenArgNumBytes >= 48) {
4030b57cec5SDimitry Andric     if (Func.hasFnAttribute("calls-enqueue-kernel")) {
4040b57cec5SDimitry Andric       emitKernelArg(DL, Int8PtrTy, ValueKind::HiddenDefaultQueue);
4050b57cec5SDimitry Andric       emitKernelArg(DL, Int8PtrTy, ValueKind::HiddenCompletionAction);
4060b57cec5SDimitry Andric     } else {
4070b57cec5SDimitry Andric       emitKernelArg(DL, Int8PtrTy, ValueKind::HiddenNone);
4080b57cec5SDimitry Andric       emitKernelArg(DL, Int8PtrTy, ValueKind::HiddenNone);
4090b57cec5SDimitry Andric     }
4100b57cec5SDimitry Andric   }
4110b57cec5SDimitry Andric 
4120b57cec5SDimitry Andric   // Emit the pointer argument for multi-grid object.
4130b57cec5SDimitry Andric   if (HiddenArgNumBytes >= 56)
4140b57cec5SDimitry Andric     emitKernelArg(DL, Int8PtrTy, ValueKind::HiddenMultiGridSyncArg);
4150b57cec5SDimitry Andric }
4160b57cec5SDimitry Andric 
4170b57cec5SDimitry Andric bool MetadataStreamerV2::emitTo(AMDGPUTargetStreamer &TargetStreamer) {
4180b57cec5SDimitry Andric   return TargetStreamer.EmitHSAMetadata(getHSAMetadata());
4190b57cec5SDimitry Andric }
4200b57cec5SDimitry Andric 
4210b57cec5SDimitry Andric void MetadataStreamerV2::begin(const Module &Mod) {
4220b57cec5SDimitry Andric   emitVersion();
4230b57cec5SDimitry Andric   emitPrintf(Mod);
4240b57cec5SDimitry Andric }
4250b57cec5SDimitry Andric 
4260b57cec5SDimitry Andric void MetadataStreamerV2::end() {
4270b57cec5SDimitry Andric   std::string HSAMetadataString;
4280b57cec5SDimitry Andric   if (toString(HSAMetadata, HSAMetadataString))
4290b57cec5SDimitry Andric     return;
4300b57cec5SDimitry Andric 
4310b57cec5SDimitry Andric   if (DumpHSAMetadata)
4320b57cec5SDimitry Andric     dump(HSAMetadataString);
4330b57cec5SDimitry Andric   if (VerifyHSAMetadata)
4340b57cec5SDimitry Andric     verify(HSAMetadataString);
4350b57cec5SDimitry Andric }
4360b57cec5SDimitry Andric 
4370b57cec5SDimitry Andric void MetadataStreamerV2::emitKernel(const MachineFunction &MF,
4380b57cec5SDimitry Andric                                     const SIProgramInfo &ProgramInfo) {
4390b57cec5SDimitry Andric   auto &Func = MF.getFunction();
4400b57cec5SDimitry Andric   if (Func.getCallingConv() != CallingConv::AMDGPU_KERNEL)
4410b57cec5SDimitry Andric     return;
4420b57cec5SDimitry Andric 
4430b57cec5SDimitry Andric   auto CodeProps = getHSACodeProps(MF, ProgramInfo);
4440b57cec5SDimitry Andric   auto DebugProps = getHSADebugProps(MF, ProgramInfo);
4450b57cec5SDimitry Andric 
4460b57cec5SDimitry Andric   HSAMetadata.mKernels.push_back(Kernel::Metadata());
4470b57cec5SDimitry Andric   auto &Kernel = HSAMetadata.mKernels.back();
4480b57cec5SDimitry Andric 
449*5ffd83dbSDimitry Andric   Kernel.mName = std::string(Func.getName());
4500b57cec5SDimitry Andric   Kernel.mSymbolName = (Twine(Func.getName()) + Twine("@kd")).str();
4510b57cec5SDimitry Andric   emitKernelLanguage(Func);
4520b57cec5SDimitry Andric   emitKernelAttrs(Func);
4530b57cec5SDimitry Andric   emitKernelArgs(Func);
4540b57cec5SDimitry Andric   HSAMetadata.mKernels.back().mCodeProps = CodeProps;
4550b57cec5SDimitry Andric   HSAMetadata.mKernels.back().mDebugProps = DebugProps;
4560b57cec5SDimitry Andric }
4570b57cec5SDimitry Andric 
4580b57cec5SDimitry Andric //===----------------------------------------------------------------------===//
4590b57cec5SDimitry Andric // HSAMetadataStreamerV3
4600b57cec5SDimitry Andric //===----------------------------------------------------------------------===//
4610b57cec5SDimitry Andric 
4620b57cec5SDimitry Andric void MetadataStreamerV3::dump(StringRef HSAMetadataString) const {
4630b57cec5SDimitry Andric   errs() << "AMDGPU HSA Metadata:\n" << HSAMetadataString << '\n';
4640b57cec5SDimitry Andric }
4650b57cec5SDimitry Andric 
4660b57cec5SDimitry Andric void MetadataStreamerV3::verify(StringRef HSAMetadataString) const {
4670b57cec5SDimitry Andric   errs() << "AMDGPU HSA Metadata Parser Test: ";
4680b57cec5SDimitry Andric 
4690b57cec5SDimitry Andric   msgpack::Document FromHSAMetadataString;
4700b57cec5SDimitry Andric 
4710b57cec5SDimitry Andric   if (!FromHSAMetadataString.fromYAML(HSAMetadataString)) {
4720b57cec5SDimitry Andric     errs() << "FAIL\n";
4730b57cec5SDimitry Andric     return;
4740b57cec5SDimitry Andric   }
4750b57cec5SDimitry Andric 
4760b57cec5SDimitry Andric   std::string ToHSAMetadataString;
4770b57cec5SDimitry Andric   raw_string_ostream StrOS(ToHSAMetadataString);
4780b57cec5SDimitry Andric   FromHSAMetadataString.toYAML(StrOS);
4790b57cec5SDimitry Andric 
4800b57cec5SDimitry Andric   errs() << (HSAMetadataString == StrOS.str() ? "PASS" : "FAIL") << '\n';
4810b57cec5SDimitry Andric   if (HSAMetadataString != ToHSAMetadataString) {
4820b57cec5SDimitry Andric     errs() << "Original input: " << HSAMetadataString << '\n'
4830b57cec5SDimitry Andric            << "Produced output: " << StrOS.str() << '\n';
4840b57cec5SDimitry Andric   }
4850b57cec5SDimitry Andric }
4860b57cec5SDimitry Andric 
4870b57cec5SDimitry Andric Optional<StringRef>
4880b57cec5SDimitry Andric MetadataStreamerV3::getAccessQualifier(StringRef AccQual) const {
4890b57cec5SDimitry Andric   return StringSwitch<Optional<StringRef>>(AccQual)
4900b57cec5SDimitry Andric       .Case("read_only", StringRef("read_only"))
4910b57cec5SDimitry Andric       .Case("write_only", StringRef("write_only"))
4920b57cec5SDimitry Andric       .Case("read_write", StringRef("read_write"))
4930b57cec5SDimitry Andric       .Default(None);
4940b57cec5SDimitry Andric }
4950b57cec5SDimitry Andric 
4960b57cec5SDimitry Andric Optional<StringRef>
4970b57cec5SDimitry Andric MetadataStreamerV3::getAddressSpaceQualifier(unsigned AddressSpace) const {
4980b57cec5SDimitry Andric   switch (AddressSpace) {
4990b57cec5SDimitry Andric   case AMDGPUAS::PRIVATE_ADDRESS:
5000b57cec5SDimitry Andric     return StringRef("private");
5010b57cec5SDimitry Andric   case AMDGPUAS::GLOBAL_ADDRESS:
5020b57cec5SDimitry Andric     return StringRef("global");
5030b57cec5SDimitry Andric   case AMDGPUAS::CONSTANT_ADDRESS:
5040b57cec5SDimitry Andric     return StringRef("constant");
5050b57cec5SDimitry Andric   case AMDGPUAS::LOCAL_ADDRESS:
5060b57cec5SDimitry Andric     return StringRef("local");
5070b57cec5SDimitry Andric   case AMDGPUAS::FLAT_ADDRESS:
5080b57cec5SDimitry Andric     return StringRef("generic");
5090b57cec5SDimitry Andric   case AMDGPUAS::REGION_ADDRESS:
5100b57cec5SDimitry Andric     return StringRef("region");
5110b57cec5SDimitry Andric   default:
5120b57cec5SDimitry Andric     return None;
5130b57cec5SDimitry Andric   }
5140b57cec5SDimitry Andric }
5150b57cec5SDimitry Andric 
5160b57cec5SDimitry Andric StringRef MetadataStreamerV3::getValueKind(Type *Ty, StringRef TypeQual,
5170b57cec5SDimitry Andric                                            StringRef BaseTypeName) const {
5180b57cec5SDimitry Andric   if (TypeQual.find("pipe") != StringRef::npos)
5190b57cec5SDimitry Andric     return "pipe";
5200b57cec5SDimitry Andric 
5210b57cec5SDimitry Andric   return StringSwitch<StringRef>(BaseTypeName)
5220b57cec5SDimitry Andric       .Case("image1d_t", "image")
5230b57cec5SDimitry Andric       .Case("image1d_array_t", "image")
5240b57cec5SDimitry Andric       .Case("image1d_buffer_t", "image")
5250b57cec5SDimitry Andric       .Case("image2d_t", "image")
5260b57cec5SDimitry Andric       .Case("image2d_array_t", "image")
5270b57cec5SDimitry Andric       .Case("image2d_array_depth_t", "image")
5280b57cec5SDimitry Andric       .Case("image2d_array_msaa_t", "image")
5290b57cec5SDimitry Andric       .Case("image2d_array_msaa_depth_t", "image")
5300b57cec5SDimitry Andric       .Case("image2d_depth_t", "image")
5310b57cec5SDimitry Andric       .Case("image2d_msaa_t", "image")
5320b57cec5SDimitry Andric       .Case("image2d_msaa_depth_t", "image")
5330b57cec5SDimitry Andric       .Case("image3d_t", "image")
5340b57cec5SDimitry Andric       .Case("sampler_t", "sampler")
5350b57cec5SDimitry Andric       .Case("queue_t", "queue")
5360b57cec5SDimitry Andric       .Default(isa<PointerType>(Ty)
5370b57cec5SDimitry Andric                    ? (Ty->getPointerAddressSpace() == AMDGPUAS::LOCAL_ADDRESS
5380b57cec5SDimitry Andric                           ? "dynamic_shared_pointer"
5390b57cec5SDimitry Andric                           : "global_buffer")
5400b57cec5SDimitry Andric                    : "by_value");
5410b57cec5SDimitry Andric }
5420b57cec5SDimitry Andric 
5430b57cec5SDimitry Andric std::string MetadataStreamerV3::getTypeName(Type *Ty, bool Signed) const {
5440b57cec5SDimitry Andric   switch (Ty->getTypeID()) {
5450b57cec5SDimitry Andric   case Type::IntegerTyID: {
5460b57cec5SDimitry Andric     if (!Signed)
5470b57cec5SDimitry Andric       return (Twine('u') + getTypeName(Ty, true)).str();
5480b57cec5SDimitry Andric 
5490b57cec5SDimitry Andric     auto BitWidth = Ty->getIntegerBitWidth();
5500b57cec5SDimitry Andric     switch (BitWidth) {
5510b57cec5SDimitry Andric     case 8:
5520b57cec5SDimitry Andric       return "char";
5530b57cec5SDimitry Andric     case 16:
5540b57cec5SDimitry Andric       return "short";
5550b57cec5SDimitry Andric     case 32:
5560b57cec5SDimitry Andric       return "int";
5570b57cec5SDimitry Andric     case 64:
5580b57cec5SDimitry Andric       return "long";
5590b57cec5SDimitry Andric     default:
5600b57cec5SDimitry Andric       return (Twine('i') + Twine(BitWidth)).str();
5610b57cec5SDimitry Andric     }
5620b57cec5SDimitry Andric   }
5630b57cec5SDimitry Andric   case Type::HalfTyID:
5640b57cec5SDimitry Andric     return "half";
5650b57cec5SDimitry Andric   case Type::FloatTyID:
5660b57cec5SDimitry Andric     return "float";
5670b57cec5SDimitry Andric   case Type::DoubleTyID:
5680b57cec5SDimitry Andric     return "double";
569*5ffd83dbSDimitry Andric   case Type::FixedVectorTyID: {
570*5ffd83dbSDimitry Andric     auto VecTy = cast<FixedVectorType>(Ty);
5710b57cec5SDimitry Andric     auto ElTy = VecTy->getElementType();
572*5ffd83dbSDimitry Andric     auto NumElements = VecTy->getNumElements();
5730b57cec5SDimitry Andric     return (Twine(getTypeName(ElTy, Signed)) + Twine(NumElements)).str();
5740b57cec5SDimitry Andric   }
5750b57cec5SDimitry Andric   default:
5760b57cec5SDimitry Andric     return "unknown";
5770b57cec5SDimitry Andric   }
5780b57cec5SDimitry Andric }
5790b57cec5SDimitry Andric 
5800b57cec5SDimitry Andric msgpack::ArrayDocNode
5810b57cec5SDimitry Andric MetadataStreamerV3::getWorkGroupDimensions(MDNode *Node) const {
5820b57cec5SDimitry Andric   auto Dims = HSAMetadataDoc->getArrayNode();
5830b57cec5SDimitry Andric   if (Node->getNumOperands() != 3)
5840b57cec5SDimitry Andric     return Dims;
5850b57cec5SDimitry Andric 
5860b57cec5SDimitry Andric   for (auto &Op : Node->operands())
5870b57cec5SDimitry Andric     Dims.push_back(Dims.getDocument()->getNode(
5880b57cec5SDimitry Andric         uint64_t(mdconst::extract<ConstantInt>(Op)->getZExtValue())));
5890b57cec5SDimitry Andric   return Dims;
5900b57cec5SDimitry Andric }
5910b57cec5SDimitry Andric 
5920b57cec5SDimitry Andric void MetadataStreamerV3::emitVersion() {
5930b57cec5SDimitry Andric   auto Version = HSAMetadataDoc->getArrayNode();
5940b57cec5SDimitry Andric   Version.push_back(Version.getDocument()->getNode(VersionMajor));
5950b57cec5SDimitry Andric   Version.push_back(Version.getDocument()->getNode(VersionMinor));
5960b57cec5SDimitry Andric   getRootMetadata("amdhsa.version") = Version;
5970b57cec5SDimitry Andric }
5980b57cec5SDimitry Andric 
5990b57cec5SDimitry Andric void MetadataStreamerV3::emitPrintf(const Module &Mod) {
6000b57cec5SDimitry Andric   auto Node = Mod.getNamedMetadata("llvm.printf.fmts");
6010b57cec5SDimitry Andric   if (!Node)
6020b57cec5SDimitry Andric     return;
6030b57cec5SDimitry Andric 
6040b57cec5SDimitry Andric   auto Printf = HSAMetadataDoc->getArrayNode();
6050b57cec5SDimitry Andric   for (auto Op : Node->operands())
6060b57cec5SDimitry Andric     if (Op->getNumOperands())
6070b57cec5SDimitry Andric       Printf.push_back(Printf.getDocument()->getNode(
6080b57cec5SDimitry Andric           cast<MDString>(Op->getOperand(0))->getString(), /*Copy=*/true));
6090b57cec5SDimitry Andric   getRootMetadata("amdhsa.printf") = Printf;
6100b57cec5SDimitry Andric }
6110b57cec5SDimitry Andric 
6120b57cec5SDimitry Andric void MetadataStreamerV3::emitKernelLanguage(const Function &Func,
6130b57cec5SDimitry Andric                                             msgpack::MapDocNode Kern) {
6140b57cec5SDimitry Andric   // TODO: What about other languages?
6150b57cec5SDimitry Andric   auto Node = Func.getParent()->getNamedMetadata("opencl.ocl.version");
6160b57cec5SDimitry Andric   if (!Node || !Node->getNumOperands())
6170b57cec5SDimitry Andric     return;
6180b57cec5SDimitry Andric   auto Op0 = Node->getOperand(0);
6190b57cec5SDimitry Andric   if (Op0->getNumOperands() <= 1)
6200b57cec5SDimitry Andric     return;
6210b57cec5SDimitry Andric 
6220b57cec5SDimitry Andric   Kern[".language"] = Kern.getDocument()->getNode("OpenCL C");
6230b57cec5SDimitry Andric   auto LanguageVersion = Kern.getDocument()->getArrayNode();
6240b57cec5SDimitry Andric   LanguageVersion.push_back(Kern.getDocument()->getNode(
6250b57cec5SDimitry Andric       mdconst::extract<ConstantInt>(Op0->getOperand(0))->getZExtValue()));
6260b57cec5SDimitry Andric   LanguageVersion.push_back(Kern.getDocument()->getNode(
6270b57cec5SDimitry Andric       mdconst::extract<ConstantInt>(Op0->getOperand(1))->getZExtValue()));
6280b57cec5SDimitry Andric   Kern[".language_version"] = LanguageVersion;
6290b57cec5SDimitry Andric }
6300b57cec5SDimitry Andric 
6310b57cec5SDimitry Andric void MetadataStreamerV3::emitKernelAttrs(const Function &Func,
6320b57cec5SDimitry Andric                                          msgpack::MapDocNode Kern) {
6330b57cec5SDimitry Andric 
6340b57cec5SDimitry Andric   if (auto Node = Func.getMetadata("reqd_work_group_size"))
6350b57cec5SDimitry Andric     Kern[".reqd_workgroup_size"] = getWorkGroupDimensions(Node);
6360b57cec5SDimitry Andric   if (auto Node = Func.getMetadata("work_group_size_hint"))
6370b57cec5SDimitry Andric     Kern[".workgroup_size_hint"] = getWorkGroupDimensions(Node);
6380b57cec5SDimitry Andric   if (auto Node = Func.getMetadata("vec_type_hint")) {
6390b57cec5SDimitry Andric     Kern[".vec_type_hint"] = Kern.getDocument()->getNode(
6400b57cec5SDimitry Andric         getTypeName(
6410b57cec5SDimitry Andric             cast<ValueAsMetadata>(Node->getOperand(0))->getType(),
6420b57cec5SDimitry Andric             mdconst::extract<ConstantInt>(Node->getOperand(1))->getZExtValue()),
6430b57cec5SDimitry Andric         /*Copy=*/true);
6440b57cec5SDimitry Andric   }
6450b57cec5SDimitry Andric   if (Func.hasFnAttribute("runtime-handle")) {
6460b57cec5SDimitry Andric     Kern[".device_enqueue_symbol"] = Kern.getDocument()->getNode(
6470b57cec5SDimitry Andric         Func.getFnAttribute("runtime-handle").getValueAsString().str(),
6480b57cec5SDimitry Andric         /*Copy=*/true);
6490b57cec5SDimitry Andric   }
6500b57cec5SDimitry Andric }
6510b57cec5SDimitry Andric 
6520b57cec5SDimitry Andric void MetadataStreamerV3::emitKernelArgs(const Function &Func,
6530b57cec5SDimitry Andric                                         msgpack::MapDocNode Kern) {
6540b57cec5SDimitry Andric   unsigned Offset = 0;
6550b57cec5SDimitry Andric   auto Args = HSAMetadataDoc->getArrayNode();
6560b57cec5SDimitry Andric   for (auto &Arg : Func.args())
6570b57cec5SDimitry Andric     emitKernelArg(Arg, Offset, Args);
6580b57cec5SDimitry Andric 
6590b57cec5SDimitry Andric   emitHiddenKernelArgs(Func, Offset, Args);
6600b57cec5SDimitry Andric 
6610b57cec5SDimitry Andric   Kern[".args"] = Args;
6620b57cec5SDimitry Andric }
6630b57cec5SDimitry Andric 
6640b57cec5SDimitry Andric void MetadataStreamerV3::emitKernelArg(const Argument &Arg, unsigned &Offset,
6650b57cec5SDimitry Andric                                        msgpack::ArrayDocNode Args) {
6660b57cec5SDimitry Andric   auto Func = Arg.getParent();
6670b57cec5SDimitry Andric   auto ArgNo = Arg.getArgNo();
6680b57cec5SDimitry Andric   const MDNode *Node;
6690b57cec5SDimitry Andric 
6700b57cec5SDimitry Andric   StringRef Name;
6710b57cec5SDimitry Andric   Node = Func->getMetadata("kernel_arg_name");
6720b57cec5SDimitry Andric   if (Node && ArgNo < Node->getNumOperands())
6730b57cec5SDimitry Andric     Name = cast<MDString>(Node->getOperand(ArgNo))->getString();
6740b57cec5SDimitry Andric   else if (Arg.hasName())
6750b57cec5SDimitry Andric     Name = Arg.getName();
6760b57cec5SDimitry Andric 
6770b57cec5SDimitry Andric   StringRef TypeName;
6780b57cec5SDimitry Andric   Node = Func->getMetadata("kernel_arg_type");
6790b57cec5SDimitry Andric   if (Node && ArgNo < Node->getNumOperands())
6800b57cec5SDimitry Andric     TypeName = cast<MDString>(Node->getOperand(ArgNo))->getString();
6810b57cec5SDimitry Andric 
6820b57cec5SDimitry Andric   StringRef BaseTypeName;
6830b57cec5SDimitry Andric   Node = Func->getMetadata("kernel_arg_base_type");
6840b57cec5SDimitry Andric   if (Node && ArgNo < Node->getNumOperands())
6850b57cec5SDimitry Andric     BaseTypeName = cast<MDString>(Node->getOperand(ArgNo))->getString();
6860b57cec5SDimitry Andric 
6870b57cec5SDimitry Andric   StringRef AccQual;
6880b57cec5SDimitry Andric   if (Arg.getType()->isPointerTy() && Arg.onlyReadsMemory() &&
6890b57cec5SDimitry Andric       Arg.hasNoAliasAttr()) {
6900b57cec5SDimitry Andric     AccQual = "read_only";
6910b57cec5SDimitry Andric   } else {
6920b57cec5SDimitry Andric     Node = Func->getMetadata("kernel_arg_access_qual");
6930b57cec5SDimitry Andric     if (Node && ArgNo < Node->getNumOperands())
6940b57cec5SDimitry Andric       AccQual = cast<MDString>(Node->getOperand(ArgNo))->getString();
6950b57cec5SDimitry Andric   }
6960b57cec5SDimitry Andric 
6970b57cec5SDimitry Andric   StringRef TypeQual;
6980b57cec5SDimitry Andric   Node = Func->getMetadata("kernel_arg_type_qual");
6990b57cec5SDimitry Andric   if (Node && ArgNo < Node->getNumOperands())
7000b57cec5SDimitry Andric     TypeQual = cast<MDString>(Node->getOperand(ArgNo))->getString();
7010b57cec5SDimitry Andric 
7020b57cec5SDimitry Andric   Type *Ty = Arg.getType();
7030b57cec5SDimitry Andric   const DataLayout &DL = Func->getParent()->getDataLayout();
7040b57cec5SDimitry Andric 
705*5ffd83dbSDimitry Andric   MaybeAlign PointeeAlign;
7060b57cec5SDimitry Andric   if (auto PtrTy = dyn_cast<PointerType>(Ty)) {
7070b57cec5SDimitry Andric     if (PtrTy->getAddressSpace() == AMDGPUAS::LOCAL_ADDRESS) {
708*5ffd83dbSDimitry Andric       PointeeAlign = DL.getValueOrABITypeAlignment(Arg.getParamAlign(),
709*5ffd83dbSDimitry Andric                                                    PtrTy->getElementType());
7100b57cec5SDimitry Andric     }
7110b57cec5SDimitry Andric   }
7120b57cec5SDimitry Andric 
7130b57cec5SDimitry Andric   emitKernelArg(Func->getParent()->getDataLayout(), Arg.getType(),
7140b57cec5SDimitry Andric                 getValueKind(Arg.getType(), TypeQual, BaseTypeName), Offset,
7150b57cec5SDimitry Andric                 Args, PointeeAlign, Name, TypeName, BaseTypeName, AccQual,
7160b57cec5SDimitry Andric                 TypeQual);
7170b57cec5SDimitry Andric }
7180b57cec5SDimitry Andric 
7190b57cec5SDimitry Andric void MetadataStreamerV3::emitKernelArg(const DataLayout &DL, Type *Ty,
7200b57cec5SDimitry Andric                                        StringRef ValueKind, unsigned &Offset,
7210b57cec5SDimitry Andric                                        msgpack::ArrayDocNode Args,
722*5ffd83dbSDimitry Andric                                        MaybeAlign PointeeAlign, StringRef Name,
7230b57cec5SDimitry Andric                                        StringRef TypeName,
7240b57cec5SDimitry Andric                                        StringRef BaseTypeName,
7250b57cec5SDimitry Andric                                        StringRef AccQual, StringRef TypeQual) {
7260b57cec5SDimitry Andric   auto Arg = Args.getDocument()->getMapNode();
7270b57cec5SDimitry Andric 
7280b57cec5SDimitry Andric   if (!Name.empty())
7290b57cec5SDimitry Andric     Arg[".name"] = Arg.getDocument()->getNode(Name, /*Copy=*/true);
7300b57cec5SDimitry Andric   if (!TypeName.empty())
7310b57cec5SDimitry Andric     Arg[".type_name"] = Arg.getDocument()->getNode(TypeName, /*Copy=*/true);
7320b57cec5SDimitry Andric   auto Size = DL.getTypeAllocSize(Ty);
733*5ffd83dbSDimitry Andric   Align Alignment = DL.getABITypeAlign(Ty);
7340b57cec5SDimitry Andric   Arg[".size"] = Arg.getDocument()->getNode(Size);
735*5ffd83dbSDimitry Andric   Offset = alignTo(Offset, Alignment);
7360b57cec5SDimitry Andric   Arg[".offset"] = Arg.getDocument()->getNode(Offset);
7370b57cec5SDimitry Andric   Offset += Size;
7380b57cec5SDimitry Andric   Arg[".value_kind"] = Arg.getDocument()->getNode(ValueKind, /*Copy=*/true);
7390b57cec5SDimitry Andric   if (PointeeAlign)
740*5ffd83dbSDimitry Andric     Arg[".pointee_align"] = Arg.getDocument()->getNode(PointeeAlign->value());
7410b57cec5SDimitry Andric 
7420b57cec5SDimitry Andric   if (auto PtrTy = dyn_cast<PointerType>(Ty))
7430b57cec5SDimitry Andric     if (auto Qualifier = getAddressSpaceQualifier(PtrTy->getAddressSpace()))
7440b57cec5SDimitry Andric       Arg[".address_space"] = Arg.getDocument()->getNode(*Qualifier, /*Copy=*/true);
7450b57cec5SDimitry Andric 
7460b57cec5SDimitry Andric   if (auto AQ = getAccessQualifier(AccQual))
7470b57cec5SDimitry Andric     Arg[".access"] = Arg.getDocument()->getNode(*AQ, /*Copy=*/true);
7480b57cec5SDimitry Andric 
7490b57cec5SDimitry Andric   // TODO: Emit Arg[".actual_access"].
7500b57cec5SDimitry Andric 
7510b57cec5SDimitry Andric   SmallVector<StringRef, 1> SplitTypeQuals;
7520b57cec5SDimitry Andric   TypeQual.split(SplitTypeQuals, " ", -1, false);
7530b57cec5SDimitry Andric   for (StringRef Key : SplitTypeQuals) {
7540b57cec5SDimitry Andric     if (Key == "const")
7550b57cec5SDimitry Andric       Arg[".is_const"] = Arg.getDocument()->getNode(true);
7560b57cec5SDimitry Andric     else if (Key == "restrict")
7570b57cec5SDimitry Andric       Arg[".is_restrict"] = Arg.getDocument()->getNode(true);
7580b57cec5SDimitry Andric     else if (Key == "volatile")
7590b57cec5SDimitry Andric       Arg[".is_volatile"] = Arg.getDocument()->getNode(true);
7600b57cec5SDimitry Andric     else if (Key == "pipe")
7610b57cec5SDimitry Andric       Arg[".is_pipe"] = Arg.getDocument()->getNode(true);
7620b57cec5SDimitry Andric   }
7630b57cec5SDimitry Andric 
7640b57cec5SDimitry Andric   Args.push_back(Arg);
7650b57cec5SDimitry Andric }
7660b57cec5SDimitry Andric 
7670b57cec5SDimitry Andric void MetadataStreamerV3::emitHiddenKernelArgs(const Function &Func,
7680b57cec5SDimitry Andric                                               unsigned &Offset,
7690b57cec5SDimitry Andric                                               msgpack::ArrayDocNode Args) {
7700b57cec5SDimitry Andric   int HiddenArgNumBytes =
7710b57cec5SDimitry Andric       getIntegerAttribute(Func, "amdgpu-implicitarg-num-bytes", 0);
7720b57cec5SDimitry Andric 
7730b57cec5SDimitry Andric   if (!HiddenArgNumBytes)
7740b57cec5SDimitry Andric     return;
7750b57cec5SDimitry Andric 
7760b57cec5SDimitry Andric   auto &DL = Func.getParent()->getDataLayout();
7770b57cec5SDimitry Andric   auto Int64Ty = Type::getInt64Ty(Func.getContext());
7780b57cec5SDimitry Andric 
7790b57cec5SDimitry Andric   if (HiddenArgNumBytes >= 8)
7800b57cec5SDimitry Andric     emitKernelArg(DL, Int64Ty, "hidden_global_offset_x", Offset, Args);
7810b57cec5SDimitry Andric   if (HiddenArgNumBytes >= 16)
7820b57cec5SDimitry Andric     emitKernelArg(DL, Int64Ty, "hidden_global_offset_y", Offset, Args);
7830b57cec5SDimitry Andric   if (HiddenArgNumBytes >= 24)
7840b57cec5SDimitry Andric     emitKernelArg(DL, Int64Ty, "hidden_global_offset_z", Offset, Args);
7850b57cec5SDimitry Andric 
7860b57cec5SDimitry Andric   auto Int8PtrTy =
7870b57cec5SDimitry Andric       Type::getInt8PtrTy(Func.getContext(), AMDGPUAS::GLOBAL_ADDRESS);
7880b57cec5SDimitry Andric 
7890b57cec5SDimitry Andric   // Emit "printf buffer" argument if printf is used, otherwise emit dummy
7900b57cec5SDimitry Andric   // "none" argument.
7910b57cec5SDimitry Andric   if (HiddenArgNumBytes >= 32) {
7920b57cec5SDimitry Andric     if (Func.getParent()->getNamedMetadata("llvm.printf.fmts"))
7930b57cec5SDimitry Andric       emitKernelArg(DL, Int8PtrTy, "hidden_printf_buffer", Offset, Args);
794480093f4SDimitry Andric     else if (Func.getParent()->getFunction("__ockl_hostcall_internal")) {
795480093f4SDimitry Andric       // The printf runtime binding pass should have ensured that hostcall and
796480093f4SDimitry Andric       // printf are not used in the same module.
797480093f4SDimitry Andric       assert(!Func.getParent()->getNamedMetadata("llvm.printf.fmts"));
798480093f4SDimitry Andric       emitKernelArg(DL, Int8PtrTy, "hidden_hostcall_buffer", Offset, Args);
799480093f4SDimitry Andric     } else
8000b57cec5SDimitry Andric       emitKernelArg(DL, Int8PtrTy, "hidden_none", Offset, Args);
8010b57cec5SDimitry Andric   }
8020b57cec5SDimitry Andric 
8030b57cec5SDimitry Andric   // Emit "default queue" and "completion action" arguments if enqueue kernel is
8040b57cec5SDimitry Andric   // used, otherwise emit dummy "none" arguments.
8050b57cec5SDimitry Andric   if (HiddenArgNumBytes >= 48) {
8060b57cec5SDimitry Andric     if (Func.hasFnAttribute("calls-enqueue-kernel")) {
8070b57cec5SDimitry Andric       emitKernelArg(DL, Int8PtrTy, "hidden_default_queue", Offset, Args);
8080b57cec5SDimitry Andric       emitKernelArg(DL, Int8PtrTy, "hidden_completion_action", Offset, Args);
8090b57cec5SDimitry Andric     } else {
8100b57cec5SDimitry Andric       emitKernelArg(DL, Int8PtrTy, "hidden_none", Offset, Args);
8110b57cec5SDimitry Andric       emitKernelArg(DL, Int8PtrTy, "hidden_none", Offset, Args);
8120b57cec5SDimitry Andric     }
8130b57cec5SDimitry Andric   }
8140b57cec5SDimitry Andric 
8150b57cec5SDimitry Andric   // Emit the pointer argument for multi-grid object.
8160b57cec5SDimitry Andric   if (HiddenArgNumBytes >= 56)
8170b57cec5SDimitry Andric     emitKernelArg(DL, Int8PtrTy, "hidden_multigrid_sync_arg", Offset, Args);
8180b57cec5SDimitry Andric }
8190b57cec5SDimitry Andric 
8200b57cec5SDimitry Andric msgpack::MapDocNode
8210b57cec5SDimitry Andric MetadataStreamerV3::getHSAKernelProps(const MachineFunction &MF,
8220b57cec5SDimitry Andric                                       const SIProgramInfo &ProgramInfo) const {
8230b57cec5SDimitry Andric   const GCNSubtarget &STM = MF.getSubtarget<GCNSubtarget>();
8240b57cec5SDimitry Andric   const SIMachineFunctionInfo &MFI = *MF.getInfo<SIMachineFunctionInfo>();
8250b57cec5SDimitry Andric   const Function &F = MF.getFunction();
8260b57cec5SDimitry Andric 
8270b57cec5SDimitry Andric   auto Kern = HSAMetadataDoc->getMapNode();
8280b57cec5SDimitry Andric 
8298bcb0991SDimitry Andric   Align MaxKernArgAlign;
8300b57cec5SDimitry Andric   Kern[".kernarg_segment_size"] = Kern.getDocument()->getNode(
8310b57cec5SDimitry Andric       STM.getKernArgSegmentSize(F, MaxKernArgAlign));
8320b57cec5SDimitry Andric   Kern[".group_segment_fixed_size"] =
8330b57cec5SDimitry Andric       Kern.getDocument()->getNode(ProgramInfo.LDSSize);
8340b57cec5SDimitry Andric   Kern[".private_segment_fixed_size"] =
8350b57cec5SDimitry Andric       Kern.getDocument()->getNode(ProgramInfo.ScratchSize);
8360b57cec5SDimitry Andric   Kern[".kernarg_segment_align"] =
8378bcb0991SDimitry Andric       Kern.getDocument()->getNode(std::max(Align(4), MaxKernArgAlign).value());
8380b57cec5SDimitry Andric   Kern[".wavefront_size"] =
8390b57cec5SDimitry Andric       Kern.getDocument()->getNode(STM.getWavefrontSize());
8400b57cec5SDimitry Andric   Kern[".sgpr_count"] = Kern.getDocument()->getNode(ProgramInfo.NumSGPR);
8410b57cec5SDimitry Andric   Kern[".vgpr_count"] = Kern.getDocument()->getNode(ProgramInfo.NumVGPR);
8420b57cec5SDimitry Andric   Kern[".max_flat_workgroup_size"] =
8430b57cec5SDimitry Andric       Kern.getDocument()->getNode(MFI.getMaxFlatWorkGroupSize());
8440b57cec5SDimitry Andric   Kern[".sgpr_spill_count"] =
8450b57cec5SDimitry Andric       Kern.getDocument()->getNode(MFI.getNumSpilledSGPRs());
8460b57cec5SDimitry Andric   Kern[".vgpr_spill_count"] =
8470b57cec5SDimitry Andric       Kern.getDocument()->getNode(MFI.getNumSpilledVGPRs());
8480b57cec5SDimitry Andric 
8490b57cec5SDimitry Andric   return Kern;
8500b57cec5SDimitry Andric }
8510b57cec5SDimitry Andric 
8520b57cec5SDimitry Andric bool MetadataStreamerV3::emitTo(AMDGPUTargetStreamer &TargetStreamer) {
8530b57cec5SDimitry Andric   return TargetStreamer.EmitHSAMetadata(*HSAMetadataDoc, true);
8540b57cec5SDimitry Andric }
8550b57cec5SDimitry Andric 
8560b57cec5SDimitry Andric void MetadataStreamerV3::begin(const Module &Mod) {
8570b57cec5SDimitry Andric   emitVersion();
8580b57cec5SDimitry Andric   emitPrintf(Mod);
8590b57cec5SDimitry Andric   getRootMetadata("amdhsa.kernels") = HSAMetadataDoc->getArrayNode();
8600b57cec5SDimitry Andric }
8610b57cec5SDimitry Andric 
8620b57cec5SDimitry Andric void MetadataStreamerV3::end() {
8630b57cec5SDimitry Andric   std::string HSAMetadataString;
8640b57cec5SDimitry Andric   raw_string_ostream StrOS(HSAMetadataString);
8650b57cec5SDimitry Andric   HSAMetadataDoc->toYAML(StrOS);
8660b57cec5SDimitry Andric 
8670b57cec5SDimitry Andric   if (DumpHSAMetadata)
8680b57cec5SDimitry Andric     dump(StrOS.str());
8690b57cec5SDimitry Andric   if (VerifyHSAMetadata)
8700b57cec5SDimitry Andric     verify(StrOS.str());
8710b57cec5SDimitry Andric }
8720b57cec5SDimitry Andric 
8730b57cec5SDimitry Andric void MetadataStreamerV3::emitKernel(const MachineFunction &MF,
8740b57cec5SDimitry Andric                                     const SIProgramInfo &ProgramInfo) {
8750b57cec5SDimitry Andric   auto &Func = MF.getFunction();
8760b57cec5SDimitry Andric   auto Kern = getHSAKernelProps(MF, ProgramInfo);
8770b57cec5SDimitry Andric 
8780b57cec5SDimitry Andric   assert(Func.getCallingConv() == CallingConv::AMDGPU_KERNEL ||
8790b57cec5SDimitry Andric          Func.getCallingConv() == CallingConv::SPIR_KERNEL);
8800b57cec5SDimitry Andric 
8810b57cec5SDimitry Andric   auto Kernels =
8820b57cec5SDimitry Andric       getRootMetadata("amdhsa.kernels").getArray(/*Convert=*/true);
8830b57cec5SDimitry Andric 
8840b57cec5SDimitry Andric   {
8850b57cec5SDimitry Andric     Kern[".name"] = Kern.getDocument()->getNode(Func.getName());
8860b57cec5SDimitry Andric     Kern[".symbol"] = Kern.getDocument()->getNode(
8870b57cec5SDimitry Andric         (Twine(Func.getName()) + Twine(".kd")).str(), /*Copy=*/true);
8880b57cec5SDimitry Andric     emitKernelLanguage(Func, Kern);
8890b57cec5SDimitry Andric     emitKernelAttrs(Func, Kern);
8900b57cec5SDimitry Andric     emitKernelArgs(Func, Kern);
8910b57cec5SDimitry Andric   }
8920b57cec5SDimitry Andric 
8930b57cec5SDimitry Andric   Kernels.push_back(Kern);
8940b57cec5SDimitry Andric }
8950b57cec5SDimitry Andric 
8960b57cec5SDimitry Andric } // end namespace HSAMD
8970b57cec5SDimitry Andric } // end namespace AMDGPU
8980b57cec5SDimitry Andric } // end namespace llvm
899