From: Konstantin Zhuravlyov Date: Sat, 14 Oct 2017 19:03:51 +0000 (+0000) Subject: AMDGPU: Bring HSA metadata on par with the specification X-Git-Url: https://granicus.if.org/sourcecode?a=commitdiff_plain;h=5556d8485b8b64095a7f097b44c01f1b379ba094;p=llvm AMDGPU: Bring HSA metadata on par with the specification Differential Revision: https://reviews.llvm.org/D38753 git-svn-id: https://llvm.org/svn/llvm-project/llvm/trunk@315821 91177308-0d34-0410-b5e6-96231b3b80d8 --- diff --git a/docs/AMDGPUUsage.rst b/docs/AMDGPUUsage.rst index 12e97e97f93..2c9993af1c5 100644 --- a/docs/AMDGPUUsage.rst +++ b/docs/AMDGPUUsage.rst @@ -889,7 +889,7 @@ non-AMD key names should be prefixed by "*vendor-name*.". See :ref:`amdgpu-amdhsa-code-object-kernel-attribute-metadata-mapping-table` for the mapping definition. - "Arguments" sequence of Sequence of mappings of the + "Args" sequence of Sequence of mappings of the mapping kernel arguments. See :ref:`amdgpu-amdhsa-code-object-kernel-argument-metadata-mapping-table` for the definition of the mapping. @@ -1099,7 +1099,7 @@ non-AMD key names should be prefixed by "*vendor-name*.". .. TODO Does this apply to GlobalBuffer? - "ActualAcc" string The actual memory accesses + "ActualAccQual" string The actual memory accesses performed by the kernel on the kernel argument. Only present if "ValueKind" is "GlobalBuffer", @@ -1224,7 +1224,8 @@ non-AMD key names should be prefixed by "*vendor-name*.". =================================== ============== ========= ============== String Key Value Type Required? Description =================================== ============== ========= ============== - "DebuggerABIVersion" string + "DebuggerABIVersion" sequence of + 2 integers "ReservedNumVGPRs" integer "ReservedFirstVGPR" integer "PrivateSegmentBufferSGPR" integer diff --git a/include/llvm/Support/AMDGPUMetadata.h b/include/llvm/Support/AMDGPUMetadata.h index b8084cef1c1..448e6e78e1d 100644 --- a/include/llvm/Support/AMDGPUMetadata.h +++ b/include/llvm/Support/AMDGPUMetadata.h @@ -133,13 +133,13 @@ struct Metadata final { /// \returns True if kernel attributes metadata is empty, false otherwise. bool empty() const { - return mReqdWorkGroupSize.empty() && mWorkGroupSizeHint.empty() && - mVecTypeHint.empty() && mRuntimeHandle.empty(); + return !notEmpty(); } /// \returns True if kernel attributes metadata is not empty, false otherwise. bool notEmpty() const { - return !empty(); + return !mReqdWorkGroupSize.empty() || !mWorkGroupSizeHint.empty() || + !mVecTypeHint.empty() || !mRuntimeHandle.empty(); } }; @@ -151,6 +151,10 @@ struct Metadata final { namespace Arg { namespace Key { +/// \brief Key for Kernel::Arg::Metadata::mName. +constexpr char Name[] = "Name"; +/// \brief Key for Kernel::Arg::Metadata::mTypeName. +constexpr char TypeName[] = "TypeName"; /// \brief Key for Kernel::Arg::Metadata::mSize. constexpr char Size[] = "Size"; /// \brief Key for Kernel::Arg::Metadata::mAlign. @@ -161,26 +165,28 @@ constexpr char ValueKind[] = "ValueKind"; constexpr char ValueType[] = "ValueType"; /// \brief Key for Kernel::Arg::Metadata::mPointeeAlign. constexpr char PointeeAlign[] = "PointeeAlign"; -/// \brief Key for Kernel::Arg::Metadata::mAccQual. -constexpr char AccQual[] = "AccQual"; /// \brief Key for Kernel::Arg::Metadata::mAddrSpaceQual. constexpr char AddrSpaceQual[] = "AddrSpaceQual"; +/// \brief Key for Kernel::Arg::Metadata::mAccQual. +constexpr char AccQual[] = "AccQual"; +/// \brief Key for Kernel::Arg::Metadata::mActualAccQual. +constexpr char ActualAccQual[] = "ActualAccQual"; /// \brief Key for Kernel::Arg::Metadata::mIsConst. constexpr char IsConst[] = "IsConst"; -/// \brief Key for Kernel::Arg::Metadata::mIsPipe. -constexpr char IsPipe[] = "IsPipe"; /// \brief Key for Kernel::Arg::Metadata::mIsRestrict. constexpr char IsRestrict[] = "IsRestrict"; /// \brief Key for Kernel::Arg::Metadata::mIsVolatile. constexpr char IsVolatile[] = "IsVolatile"; -/// \brief Key for Kernel::Arg::Metadata::mName. -constexpr char Name[] = "Name"; -/// \brief Key for Kernel::Arg::Metadata::mTypeName. -constexpr char TypeName[] = "TypeName"; +/// \brief Key for Kernel::Arg::Metadata::mIsPipe. +constexpr char IsPipe[] = "IsPipe"; } // end namespace Key /// \brief In-memory representation of kernel argument metadata. struct Metadata final { + /// \brief Name. Optional. + std::string mName = std::string(); + /// \brief Type name. Optional. + std::string mTypeName = std::string(); /// \brief Size in bytes. Required. uint32_t mSize = 0; /// \brief Alignment in bytes. Required. @@ -191,22 +197,20 @@ struct Metadata final { ValueType mValueType = ValueType::Unknown; /// \brief Pointee alignment in bytes. Optional. uint32_t mPointeeAlign = 0; - /// \brief Access qualifier. Optional. - AccessQualifier mAccQual = AccessQualifier::Unknown; /// \brief Address space qualifier. Optional. AddressSpaceQualifier mAddrSpaceQual = AddressSpaceQualifier::Unknown; + /// \brief Access qualifier. Optional. + AccessQualifier mAccQual = AccessQualifier::Unknown; + /// \brief Actual access qualifier. Optional. + AccessQualifier mActualAccQual = AccessQualifier::Unknown; /// \brief True if 'const' qualifier is specified. Optional. bool mIsConst = false; - /// \brief True if 'pipe' qualifier is specified. Optional. - bool mIsPipe = false; /// \brief True if 'restrict' qualifier is specified. Optional. bool mIsRestrict = false; /// \brief True if 'volatile' qualifier is specified. Optional. bool mIsVolatile = false; - /// \brief Name. Optional. - std::string mName = std::string(); - /// \brief Type name. Optional. - std::string mTypeName = std::string(); + /// \brief True if 'pipe' qualifier is specified. Optional. + bool mIsPipe = false; /// \brief Default constructor. Metadata() = default; @@ -222,51 +226,55 @@ namespace CodeProps { namespace Key { /// \brief Key for Kernel::CodeProps::Metadata::mKernargSegmentSize. constexpr char KernargSegmentSize[] = "KernargSegmentSize"; -/// \brief Key for Kernel::CodeProps::Metadata::mWorkgroupGroupSegmentSize. -constexpr char WorkgroupGroupSegmentSize[] = "WorkgroupGroupSegmentSize"; -/// \brief Key for Kernel::CodeProps::Metadata::mWorkitemPrivateSegmentSize. -constexpr char WorkitemPrivateSegmentSize[] = "WorkitemPrivateSegmentSize"; -/// \brief Key for Kernel::CodeProps::Metadata::mWavefrontNumSGPRs. -constexpr char WavefrontNumSGPRs[] = "WavefrontNumSGPRs"; -/// \brief Key for Kernel::CodeProps::Metadata::mWorkitemNumVGPRs. -constexpr char WorkitemNumVGPRs[] = "WorkitemNumVGPRs"; +/// \brief Key for Kernel::CodeProps::Metadata::mGroupSegmentFixedSize. +constexpr char GroupSegmentFixedSize[] = "GroupSegmentFixedSize"; +/// \brief Key for Kernel::CodeProps::Metadata::mPrivateSegmentFixedSize. +constexpr char PrivateSegmentFixedSize[] = "PrivateSegmentFixedSize"; /// \brief Key for Kernel::CodeProps::Metadata::mKernargSegmentAlign. constexpr char KernargSegmentAlign[] = "KernargSegmentAlign"; -/// \brief Key for Kernel::CodeProps::Metadata::mGroupSegmentAlign. -constexpr char GroupSegmentAlign[] = "GroupSegmentAlign"; -/// \brief Key for Kernel::CodeProps::Metadata::mPrivateSegmentAlign. -constexpr char PrivateSegmentAlign[] = "PrivateSegmentAlign"; /// \brief Key for Kernel::CodeProps::Metadata::mWavefrontSize. constexpr char WavefrontSize[] = "WavefrontSize"; +/// \brief Key for Kernel::CodeProps::Metadata::mNumSGPRs. +constexpr char NumSGPRs[] = "NumSGPRs"; +/// \brief Key for Kernel::CodeProps::Metadata::mNumVGPRs. +constexpr char NumVGPRs[] = "NumVGPRs"; +/// \brief Key for Kernel::CodeProps::Metadata::mMaxFlatWorkgroupSize. +constexpr char MaxFlatWorkgroupSize[] = "MaxFlatWorkgroupSize"; +/// \brief Key for Kernel::CodeProps::Metadata::mIsDynamicCallStack. +constexpr char IsDynamicCallStack[] = "IsDynamicCallStack"; +/// \brief Key for Kernel::CodeProps::Metadata::mIsXNACKEnabled. +constexpr char IsXNACKEnabled[] = "IsXNACKEnabled"; } // end namespace Key /// \brief In-memory representation of kernel code properties metadata. struct Metadata final { /// \brief Size in bytes of the kernarg segment memory. Kernarg segment memory - /// holds the values of the arguments to the kernel. Optional. + /// holds the values of the arguments to the kernel. Required. uint64_t mKernargSegmentSize = 0; /// \brief Size in bytes of the group segment memory required by a workgroup. /// This value does not include any dynamically allocated group segment memory - /// that may be added when the kernel is dispatched. Optional. - uint32_t mWorkgroupGroupSegmentSize = 0; + /// that may be added when the kernel is dispatched. Required. + uint32_t mGroupSegmentFixedSize = 0; /// \brief Size in bytes of the private segment memory required by a workitem. - /// Private segment memory includes arg, spill and private segments. Optional. - uint32_t mWorkitemPrivateSegmentSize = 0; + /// Private segment memory includes arg, spill and private segments. Required. + uint32_t mPrivateSegmentFixedSize = 0; + /// \brief Maximum byte alignment of variables used by the kernel in the + /// kernarg memory segment. Required. + uint32_t mKernargSegmentAlign = 0; + /// \brief Wavefront size. Required. + uint32_t mWavefrontSize = 0; /// \brief Total number of SGPRs used by a wavefront. Optional. - uint16_t mWavefrontNumSGPRs = 0; + uint16_t mNumSGPRs = 0; /// \brief Total number of VGPRs used by a workitem. Optional. - uint16_t mWorkitemNumVGPRs = 0; - /// \brief Maximum byte alignment of variables used by the kernel in the - /// kernarg memory segment. Expressed as a power of two. Optional. - uint8_t mKernargSegmentAlign = 0; - /// \brief Maximum byte alignment of variables used by the kernel in the - /// group memory segment. Expressed as a power of two. Optional. - uint8_t mGroupSegmentAlign = 0; - /// \brief Maximum byte alignment of variables used by the kernel in the - /// private memory segment. Expressed as a power of two. Optional. - uint8_t mPrivateSegmentAlign = 0; - /// \brief Wavefront size. Expressed as a power of two. Optional. - uint8_t mWavefrontSize = 0; + uint16_t mNumVGPRs = 0; + /// \brief Maximum flat work-group size supported by the kernel. Optional. + uint32_t mMaxFlatWorkgroupSize = 0; + /// \brief True if the generated machine code is using a dynamically sized + /// call stack. Optional. + bool mIsDynamicCallStack = false; + /// \brief True if the generated machine code is capable of supporting XNACK. + /// Optional. + bool mIsXNACKEnabled = false; /// \brief Default constructor. Metadata() = default; @@ -280,10 +288,7 @@ struct Metadata final { /// \returns True if kernel code properties metadata is not empty, false /// otherwise. bool notEmpty() const { - return mKernargSegmentSize || mWorkgroupGroupSegmentSize || - mWorkitemPrivateSegmentSize || mWavefrontNumSGPRs || - mWorkitemNumVGPRs || mKernargSegmentAlign || mGroupSegmentAlign || - mPrivateSegmentAlign || mWavefrontSize; + return true; } }; @@ -349,6 +354,8 @@ struct Metadata final { namespace Key { /// \brief Key for Kernel::Metadata::mName. constexpr char Name[] = "Name"; +/// \brief Key for Kernel::Metadata::mSymbolName. +constexpr char SymbolName[] = "SymbolName"; /// \brief Key for Kernel::Metadata::mLanguage. constexpr char Language[] = "Language"; /// \brief Key for Kernel::Metadata::mLanguageVersion. @@ -365,8 +372,10 @@ constexpr char DebugProps[] = "DebugProps"; /// \brief In-memory representation of kernel metadata. struct Metadata final { - /// \brief Name. Required. + /// \brief Kernel source name. Required. std::string mName = std::string(); + /// \brief Kernel descriptor name. Required. + std::string mSymbolName = std::string(); /// \brief Language. Optional. std::string mLanguage = std::string(); /// \brief Language version. Optional. @@ -401,7 +410,7 @@ struct Metadata final { std::vector mVersion = std::vector(); /// \brief Printf metadata. Optional. std::vector mPrintf = std::vector(); - /// \brief Kernels metadata. Optional. + /// \brief Kernels metadata. Required. std::vector mKernels = std::vector(); /// \brief Default constructor. diff --git a/lib/Support/AMDGPUMetadata.cpp b/lib/Support/AMDGPUMetadata.cpp index 00fa91a7cf0..8a58f91b37a 100644 --- a/lib/Support/AMDGPUMetadata.cpp +++ b/lib/Support/AMDGPUMetadata.cpp @@ -104,46 +104,50 @@ struct MappingTraits { template <> struct MappingTraits { static void mapping(IO &YIO, Kernel::Arg::Metadata &MD) { + YIO.mapOptional(Kernel::Arg::Key::Name, MD.mName, std::string()); + YIO.mapOptional(Kernel::Arg::Key::TypeName, MD.mTypeName, std::string()); YIO.mapRequired(Kernel::Arg::Key::Size, MD.mSize); YIO.mapRequired(Kernel::Arg::Key::Align, MD.mAlign); YIO.mapRequired(Kernel::Arg::Key::ValueKind, MD.mValueKind); YIO.mapRequired(Kernel::Arg::Key::ValueType, MD.mValueType); YIO.mapOptional(Kernel::Arg::Key::PointeeAlign, MD.mPointeeAlign, uint32_t(0)); - YIO.mapOptional(Kernel::Arg::Key::AccQual, MD.mAccQual, - AccessQualifier::Unknown); YIO.mapOptional(Kernel::Arg::Key::AddrSpaceQual, MD.mAddrSpaceQual, AddressSpaceQualifier::Unknown); + YIO.mapOptional(Kernel::Arg::Key::AccQual, MD.mAccQual, + AccessQualifier::Unknown); + YIO.mapOptional(Kernel::Arg::Key::ActualAccQual, MD.mActualAccQual, + AccessQualifier::Unknown); YIO.mapOptional(Kernel::Arg::Key::IsConst, MD.mIsConst, false); - YIO.mapOptional(Kernel::Arg::Key::IsPipe, MD.mIsPipe, false); YIO.mapOptional(Kernel::Arg::Key::IsRestrict, MD.mIsRestrict, false); YIO.mapOptional(Kernel::Arg::Key::IsVolatile, MD.mIsVolatile, false); - YIO.mapOptional(Kernel::Arg::Key::Name, MD.mName, std::string()); - YIO.mapOptional(Kernel::Arg::Key::TypeName, MD.mTypeName, std::string()); + YIO.mapOptional(Kernel::Arg::Key::IsPipe, MD.mIsPipe, false); } }; template <> struct MappingTraits { static void mapping(IO &YIO, Kernel::CodeProps::Metadata &MD) { - YIO.mapOptional(Kernel::CodeProps::Key::KernargSegmentSize, - MD.mKernargSegmentSize, uint64_t(0)); - YIO.mapOptional(Kernel::CodeProps::Key::WorkgroupGroupSegmentSize, - MD.mWorkgroupGroupSegmentSize, uint32_t(0)); - YIO.mapOptional(Kernel::CodeProps::Key::WorkitemPrivateSegmentSize, - MD.mWorkitemPrivateSegmentSize, uint32_t(0)); - YIO.mapOptional(Kernel::CodeProps::Key::WavefrontNumSGPRs, - MD.mWavefrontNumSGPRs, uint16_t(0)); - YIO.mapOptional(Kernel::CodeProps::Key::WorkitemNumVGPRs, - MD.mWorkitemNumVGPRs, uint16_t(0)); - YIO.mapOptional(Kernel::CodeProps::Key::KernargSegmentAlign, - MD.mKernargSegmentAlign, uint8_t(0)); - YIO.mapOptional(Kernel::CodeProps::Key::GroupSegmentAlign, - MD.mGroupSegmentAlign, uint8_t(0)); - YIO.mapOptional(Kernel::CodeProps::Key::PrivateSegmentAlign, - MD.mPrivateSegmentAlign, uint8_t(0)); - YIO.mapOptional(Kernel::CodeProps::Key::WavefrontSize, - MD.mWavefrontSize, uint8_t(0)); + YIO.mapRequired(Kernel::CodeProps::Key::KernargSegmentSize, + MD.mKernargSegmentSize); + YIO.mapRequired(Kernel::CodeProps::Key::GroupSegmentFixedSize, + MD.mGroupSegmentFixedSize); + YIO.mapRequired(Kernel::CodeProps::Key::PrivateSegmentFixedSize, + MD.mPrivateSegmentFixedSize); + YIO.mapRequired(Kernel::CodeProps::Key::KernargSegmentAlign, + MD.mKernargSegmentAlign); + YIO.mapRequired(Kernel::CodeProps::Key::WavefrontSize, + MD.mWavefrontSize); + YIO.mapOptional(Kernel::CodeProps::Key::NumSGPRs, + MD.mNumSGPRs, uint16_t(0)); + YIO.mapOptional(Kernel::CodeProps::Key::NumVGPRs, + MD.mNumVGPRs, uint16_t(0)); + YIO.mapOptional(Kernel::CodeProps::Key::MaxFlatWorkgroupSize, + MD.mMaxFlatWorkgroupSize, uint32_t(0)); + YIO.mapOptional(Kernel::CodeProps::Key::IsDynamicCallStack, + MD.mIsDynamicCallStack, false); + YIO.mapOptional(Kernel::CodeProps::Key::IsXNACKEnabled, + MD.mIsXNACKEnabled, false); } }; @@ -167,6 +171,7 @@ template <> struct MappingTraits { static void mapping(IO &YIO, Kernel::Metadata &MD) { YIO.mapRequired(Kernel::Key::Name, MD.mName); + YIO.mapRequired(Kernel::Key::SymbolName, MD.mSymbolName); YIO.mapOptional(Kernel::Key::Language, MD.mLanguage, std::string()); YIO.mapOptional(Kernel::Key::LanguageVersion, MD.mLanguageVersion, std::vector()); diff --git a/lib/Target/AMDGPU/AMDGPUAsmPrinter.cpp b/lib/Target/AMDGPU/AMDGPUAsmPrinter.cpp index ca828b45c54..b3650b4ac89 100644 --- a/lib/Target/AMDGPU/AMDGPUAsmPrinter.cpp +++ b/lib/Target/AMDGPU/AMDGPUAsmPrinter.cpp @@ -199,7 +199,9 @@ void AMDGPUAsmPrinter::EmitFunctionBodyStart() { if (TM.getTargetTriple().getOS() != Triple::AMDHSA) return; - HSAMetadataStream.emitKernel(*MF->getFunction(), KernelCode); + HSAMetadataStream.emitKernel(*MF->getFunction(), + getHSACodeProps(*MF, CurrentProgramInfo), + getHSADebugProps(*MF, CurrentProgramInfo)); } void AMDGPUAsmPrinter::EmitFunctionEntryLabel() { @@ -1155,6 +1157,53 @@ void AMDGPUAsmPrinter::getAmdKernelCode(amd_kernel_code_t &Out, } } +AMDGPU::HSAMD::Kernel::CodeProps::Metadata AMDGPUAsmPrinter::getHSACodeProps( + const MachineFunction &MF, + const SIProgramInfo &ProgramInfo) const { + const SISubtarget &STM = MF.getSubtarget(); + const SIMachineFunctionInfo &MFI = *MF.getInfo(); + HSAMD::Kernel::CodeProps::Metadata HSACodeProps; + + HSACodeProps.mKernargSegmentSize = + STM.getKernArgSegmentSize(MF, MFI.getABIArgOffset()); + HSACodeProps.mGroupSegmentFixedSize = ProgramInfo.LDSSize; + HSACodeProps.mPrivateSegmentFixedSize = ProgramInfo.ScratchSize; + HSACodeProps.mKernargSegmentAlign = + std::max(uint32_t(4), MFI.getMaxKernArgAlign()); + HSACodeProps.mWavefrontSize = STM.getWavefrontSize(); + HSACodeProps.mNumSGPRs = CurrentProgramInfo.NumSGPR; + HSACodeProps.mNumVGPRs = CurrentProgramInfo.NumVGPR; + // TODO: Emit HSACodeProps.mMaxFlatWorkgroupSize. + HSACodeProps.mIsDynamicCallStack = ProgramInfo.DynamicCallStack; + HSACodeProps.mIsXNACKEnabled = STM.isXNACKEnabled(); + + return HSACodeProps; +} + +AMDGPU::HSAMD::Kernel::DebugProps::Metadata AMDGPUAsmPrinter::getHSADebugProps( + const MachineFunction &MF, + const SIProgramInfo &ProgramInfo) const { + const SISubtarget &STM = MF.getSubtarget(); + HSAMD::Kernel::DebugProps::Metadata HSADebugProps; + + if (!STM.debuggerSupported()) + return HSADebugProps; + + HSADebugProps.mDebuggerABIVersion.push_back(1); + HSADebugProps.mDebuggerABIVersion.push_back(0); + HSADebugProps.mReservedNumVGPRs = ProgramInfo.ReservedVGPRCount; + HSADebugProps.mReservedFirstVGPR = ProgramInfo.ReservedVGPRFirst; + + if (STM.debuggerEmitPrologue()) { + HSADebugProps.mPrivateSegmentBufferSGPR = + ProgramInfo.DebuggerPrivateSegmentBufferSGPR; + HSADebugProps.mWavefrontPrivateSegmentOffsetSGPR = + ProgramInfo.DebuggerWavefrontPrivateSegmentOffsetSGPR; + } + + return HSADebugProps; +} + bool AMDGPUAsmPrinter::PrintAsmOperand(const MachineInstr *MI, unsigned OpNo, unsigned AsmVariant, const char *ExtraCode, raw_ostream &O) { diff --git a/lib/Target/AMDGPU/AMDGPUAsmPrinter.h b/lib/Target/AMDGPU/AMDGPUAsmPrinter.h index 88503e75dd2..74e38455058 100644 --- a/lib/Target/AMDGPU/AMDGPUAsmPrinter.h +++ b/lib/Target/AMDGPU/AMDGPUAsmPrinter.h @@ -128,6 +128,13 @@ private: unsigned &NumSGPR, unsigned &NumVGPR) const; + AMDGPU::HSAMD::Kernel::CodeProps::Metadata getHSACodeProps( + const MachineFunction &MF, + const SIProgramInfo &ProgramInfo) const; + AMDGPU::HSAMD::Kernel::DebugProps::Metadata getHSADebugProps( + const MachineFunction &MF, + const SIProgramInfo &ProgramInfo) const; + /// \brief Emit register usage information so that the GPU driver /// can correctly setup the GPU state. void EmitProgramInfoR600(const MachineFunction &MF); diff --git a/lib/Target/AMDGPU/MCTargetDesc/AMDGPUHSAMetadataStreamer.cpp b/lib/Target/AMDGPU/MCTargetDesc/AMDGPUHSAMetadataStreamer.cpp index 7dda7c16651..dacf5d37aa1 100644 --- a/lib/Target/AMDGPU/MCTargetDesc/AMDGPUHSAMetadataStreamer.cpp +++ b/lib/Target/AMDGPU/MCTargetDesc/AMDGPUHSAMetadataStreamer.cpp @@ -279,10 +279,15 @@ void MetadataStreamer::emitKernelArg(const Argument &Arg) { auto ArgNo = Arg.getArgNo(); const MDNode *Node; - StringRef TypeQual; - Node = Func->getMetadata("kernel_arg_type_qual"); + StringRef Name; + Node = Func->getMetadata("kernel_arg_name"); if (Node && ArgNo < Node->getNumOperands()) - TypeQual = cast(Node->getOperand(ArgNo))->getString(); + Name = cast(Node->getOperand(ArgNo))->getString(); + + StringRef TypeName; + Node = Func->getMetadata("kernel_arg_type"); + if (Node && ArgNo < Node->getNumOperands()) + TypeName = cast(Node->getOperand(ArgNo))->getString(); StringRef BaseTypeName; Node = Func->getMetadata("kernel_arg_base_type"); @@ -299,28 +304,25 @@ void MetadataStreamer::emitKernelArg(const Argument &Arg) { AccQual = cast(Node->getOperand(ArgNo))->getString(); } - StringRef Name; - Node = Func->getMetadata("kernel_arg_name"); - if (Node && ArgNo < Node->getNumOperands()) - Name = cast(Node->getOperand(ArgNo))->getString(); - - StringRef TypeName; - Node = Func->getMetadata("kernel_arg_type"); + StringRef TypeQual; + Node = Func->getMetadata("kernel_arg_type_qual"); if (Node && ArgNo < Node->getNumOperands()) - TypeName = cast(Node->getOperand(ArgNo))->getString(); + TypeQual = cast(Node->getOperand(ArgNo))->getString(); emitKernelArg(Func->getParent()->getDataLayout(), Arg.getType(), - getValueKind(Arg.getType(), TypeQual, BaseTypeName), TypeQual, - BaseTypeName, AccQual, Name, TypeName); + getValueKind(Arg.getType(), TypeQual, BaseTypeName), Name, + TypeName, BaseTypeName, AccQual, TypeQual); } void MetadataStreamer::emitKernelArg(const DataLayout &DL, Type *Ty, - ValueKind ValueKind, StringRef TypeQual, - StringRef BaseTypeName, StringRef AccQual, - StringRef Name, StringRef TypeName) { + ValueKind ValueKind, StringRef Name, + StringRef TypeName, StringRef BaseTypeName, + StringRef AccQual, StringRef TypeQual) { HSAMetadata.mKernels.back().mArgs.push_back(Kernel::Arg::Metadata()); auto &Arg = HSAMetadata.mKernels.back().mArgs.back(); + Arg.mName = Name; + Arg.mTypeName = TypeName; Arg.mSize = DL.getTypeAllocSize(Ty); Arg.mAlign = DL.getABITypeAlignment(Ty); Arg.mValueKind = ValueKind; @@ -332,62 +334,25 @@ void MetadataStreamer::emitKernelArg(const DataLayout &DL, Type *Ty, Arg.mPointeeAlign = DL.getABITypeAlignment(ElTy); } - Arg.mAccQual = getAccessQualifier(AccQual); - if (auto PtrTy = dyn_cast(Ty)) Arg.mAddrSpaceQual = getAddressSpaceQualifer(PtrTy->getAddressSpace()); + Arg.mAccQual = getAccessQualifier(AccQual); + + // TODO: Emit Arg.mActualAccQual. + SmallVector SplitTypeQuals; TypeQual.split(SplitTypeQuals, " ", -1, false); for (StringRef Key : SplitTypeQuals) { auto P = StringSwitch(Key) .Case("const", &Arg.mIsConst) - .Case("pipe", &Arg.mIsPipe) .Case("restrict", &Arg.mIsRestrict) .Case("volatile", &Arg.mIsVolatile) + .Case("pipe", &Arg.mIsPipe) .Default(nullptr); if (P) *P = true; } - - Arg.mName = Name; - Arg.mTypeName = TypeName; -} - -void MetadataStreamer::emitKernelCodeProps( - const amd_kernel_code_t &KernelCode) { - auto &CodeProps = HSAMetadata.mKernels.back().mCodeProps; - - CodeProps.mKernargSegmentSize = KernelCode.kernarg_segment_byte_size; - CodeProps.mWorkgroupGroupSegmentSize = - KernelCode.workgroup_group_segment_byte_size; - CodeProps.mWorkitemPrivateSegmentSize = - KernelCode.workitem_private_segment_byte_size; - CodeProps.mWavefrontNumSGPRs = KernelCode.wavefront_sgpr_count; - CodeProps.mWorkitemNumVGPRs = KernelCode.workitem_vgpr_count; - CodeProps.mKernargSegmentAlign = KernelCode.kernarg_segment_alignment; - CodeProps.mGroupSegmentAlign = KernelCode.group_segment_alignment; - CodeProps.mPrivateSegmentAlign = KernelCode.private_segment_alignment; - CodeProps.mWavefrontSize = KernelCode.wavefront_size; -} - -void MetadataStreamer::emitKernelDebugProps( - const amd_kernel_code_t &KernelCode) { - if (!(KernelCode.code_properties & AMD_CODE_PROPERTY_IS_DEBUG_SUPPORTED)) - return; - - auto &DebugProps = HSAMetadata.mKernels.back().mDebugProps; - - // FIXME: Need to pass down debugger ABI version through features. This is ok - // for now because we only have one version. - DebugProps.mDebuggerABIVersion.push_back(1); - DebugProps.mDebuggerABIVersion.push_back(0); - DebugProps.mReservedNumVGPRs = KernelCode.reserved_vgpr_count; - DebugProps.mReservedFirstVGPR = KernelCode.reserved_vgpr_first; - DebugProps.mPrivateSegmentBufferSGPR = - KernelCode.debug_private_segment_buffer_sgpr; - DebugProps.mWavefrontPrivateSegmentOffsetSGPR = - KernelCode.debug_wavefront_private_segment_offset_sgpr; } void MetadataStreamer::begin(const Module &Mod) { @@ -407,8 +372,10 @@ void MetadataStreamer::end() { verify(HSAMetadataString); } -void MetadataStreamer::emitKernel(const Function &Func, - const amd_kernel_code_t &KernelCode) { +void MetadataStreamer::emitKernel( + const Function &Func, + const Kernel::CodeProps::Metadata &CodeProps, + const Kernel::DebugProps::Metadata &DebugProps) { if (Func.getCallingConv() != CallingConv::AMDGPU_KERNEL) return; @@ -416,11 +383,12 @@ void MetadataStreamer::emitKernel(const Function &Func, auto &Kernel = HSAMetadata.mKernels.back(); Kernel.mName = Func.getName(); + Kernel.mSymbolName = (Twine(Func.getName()) + Twine("@kd")).str(); emitKernelLanguage(Func); emitKernelAttrs(Func); emitKernelArgs(Func); - emitKernelCodeProps(KernelCode); - emitKernelDebugProps(KernelCode); + HSAMetadata.mKernels.back().mCodeProps = CodeProps; + HSAMetadata.mKernels.back().mDebugProps = DebugProps; } } // end namespace HSAMD diff --git a/lib/Target/AMDGPU/MCTargetDesc/AMDGPUHSAMetadataStreamer.h b/lib/Target/AMDGPU/MCTargetDesc/AMDGPUHSAMetadataStreamer.h index 6a101d12914..bd6515521a7 100644 --- a/lib/Target/AMDGPU/MCTargetDesc/AMDGPUHSAMetadataStreamer.h +++ b/lib/Target/AMDGPU/MCTargetDesc/AMDGPUHSAMetadataStreamer.h @@ -68,13 +68,9 @@ private: void emitKernelArg(const Argument &Arg); void emitKernelArg(const DataLayout &DL, Type *Ty, ValueKind ValueKind, - StringRef TypeQual = "", StringRef BaseTypeName = "", - StringRef AccQual = "", StringRef Name = "", - StringRef TypeName = ""); - - void emitKernelCodeProps(const amd_kernel_code_t &KernelCode); - - void emitKernelDebugProps(const amd_kernel_code_t &KernelCode); + StringRef Name = "", StringRef TypeName = "", + StringRef BaseTypeName = "", StringRef AccQual = "", + StringRef TypeQual = ""); public: MetadataStreamer() = default; @@ -88,7 +84,9 @@ public: void end(); - void emitKernel(const Function &Func, const amd_kernel_code_t &KernelCode); + void emitKernel(const Function &Func, + const Kernel::CodeProps::Metadata &CodeProps, + const Kernel::DebugProps::Metadata &DebugProps); }; } // end namespace HSAMD diff --git a/test/CodeGen/AMDGPU/elf-notes.ll b/test/CodeGen/AMDGPU/elf-notes.ll index 5ed14ead646..1409356d2ed 100644 --- a/test/CodeGen/AMDGPU/elf-notes.ll +++ b/test/CodeGen/AMDGPU/elf-notes.ll @@ -41,13 +41,15 @@ ; OSABI-HSA-ELF: --- ; OSABI-HSA-ELF: Version: [ 1, 0 ] ; OSABI-HSA-ELF: Kernels: -; OSABI-HSA-ELF: - Name: elf_notes +; OSABI-HSA-ELF: - Name: elf_notes +; OSABI-HSA-ELF: SymbolName: 'elf_notes@kd' ; OSABI-HSA-ELF: CodeProps: -; OSABI-HSA-ELF: WavefrontNumSGPRs: 96 -; OSABI-HSA-ELF: KernargSegmentAlign: 32 -; OSABI-HSA-ELF: GroupSegmentAlign: 4 -; OSABI-HSA-ELF: PrivateSegmentAlign: 4 -; OSABI-HSA-ELF: WavefrontSize: 6 +; OSABI-HSA-ELF: KernargSegmentSize: 0 +; OSABI-HSA-ELF: GroupSegmentFixedSize: 0 +; OSABI-HSA-ELF: PrivateSegmentFixedSize: 0 +; OSABI-HSA-ELF: KernargSegmentAlign: 4 +; OSABI-HSA-ELF: WavefrontSize: 64 +; OSABI-HSA-ELF: NumSGPRs: 96 ; OSABI-HSA-ELF: ... ; OSABI-HSA-ELF-NOT: Unknown note type ; OSABI-HSA-ELF-NOT: NT_AMD_AMDGPU_PAL_METADATA (PAL Metadata) diff --git a/test/CodeGen/AMDGPU/hsa-metadata-deduce-ro-arg.ll b/test/CodeGen/AMDGPU/hsa-metadata-deduce-ro-arg.ll index 508bef0b22f..c07c5556ce3 100644 --- a/test/CodeGen/AMDGPU/hsa-metadata-deduce-ro-arg.ll +++ b/test/CodeGen/AMDGPU/hsa-metadata-deduce-ro-arg.ll @@ -1,24 +1,24 @@ ; RUN: llc -mtriple=amdgcn-amd-amdhsa -filetype=obj -o - < %s | llvm-readobj -elf-output-style=GNU -notes | FileCheck %s ; CHECK: - Name: test_ro_arg -; CHECK: Args: -; CHECK-NEXT: - Size: 8 +; CHECK-NEXT: SymbolName: 'test_ro_arg@kd' +; CHECK-NEXT: Args: +; CHECK-NEXT: - TypeName: 'float*' +; CHECK-NEXT: Size: 8 ; CHECK-NEXT: Align: 8 ; CHECK-NEXT: ValueKind: GlobalBuffer ; CHECK-NEXT: ValueType: F32 -; CHECK-NEXT: AccQual: ReadOnly ; CHECK-NEXT: AddrSpaceQual: Global +; CHECK-NEXT: AccQual: ReadOnly ; CHECK-NEXT: IsConst: true ; CHECK-NEXT: IsRestrict: true -; CHECK-NEXT: TypeName: 'float*' - -; CHECK-NEXT: - Size: 8 +; CHECK-NEXT: - TypeName: 'float*' +; CHECK-NEXT: Size: 8 ; CHECK-NEXT: Align: 8 ; CHECK-NEXT: ValueKind: GlobalBuffer ; CHECK-NEXT: ValueType: F32 -; CHECK-NEXT: AccQual: Default ; CHECK-NEXT: AddrSpaceQual: Global -; CHECK-NEXT: TypeName: 'float*' +; CHECK-NEXT: AccQual: Default define amdgpu_kernel void @test_ro_arg(float addrspace(1)* noalias readonly %in, float addrspace(1)* %out) !kernel_arg_addr_space !0 !kernel_arg_access_qual !1 !kernel_arg_type !2 @@ -30,4 +30,3 @@ define amdgpu_kernel void @test_ro_arg(float addrspace(1)* noalias readonly %in, !1 = !{!"none", !"none"} !2 = !{!"float*", !"float*"} !3 = !{!"const restrict", !""} - diff --git a/test/CodeGen/AMDGPU/hsa-metadata-from-llvm-ir-full.ll b/test/CodeGen/AMDGPU/hsa-metadata-from-llvm-ir-full.ll index da7be20bb8b..4ac9bacebe1 100644 --- a/test/CodeGen/AMDGPU/hsa-metadata-from-llvm-ir-full.ll +++ b/test/CodeGen/AMDGPU/hsa-metadata-from-llvm-ir-full.ll @@ -1,3 +1,6 @@ +; RUN: llc -mtriple=amdgcn-amd-amdhsa -mcpu=gfx700 -filetype=obj -o - < %s | llvm-readobj -elf-output-style=GNU -notes | FileCheck --check-prefix=CHECK --check-prefix=GFX700 --check-prefix=NOTES %s +; RUN: llc -mtriple=amdgcn-amd-amdhsa -mcpu=gfx800 -filetype=obj -o - < %s | llvm-readobj -elf-output-style=GNU -notes | FileCheck --check-prefix=CHECK --check-prefix=GFX800 --check-prefix=NOTES %s +; RUN: llc -mtriple=amdgcn-amd-amdhsa -mcpu=gfx900 -filetype=obj -o - < %s | llvm-readobj -elf-output-style=GNU -notes | FileCheck --check-prefix=CHECK --check-prefix=GFX900 --check-prefix=NOTES %s ; RUN: llc -mtriple=amdgcn-amd-amdhsa -mcpu=gfx700 -amdgpu-dump-hsa-metadata -amdgpu-verify-hsa-metadata -filetype=obj -o - < %s 2>&1 | FileCheck --check-prefix=PARSER %s ; RUN: llc -mtriple=amdgcn-amd-amdhsa -mcpu=gfx800 -amdgpu-dump-hsa-metadata -amdgpu-verify-hsa-metadata -filetype=obj -o - < %s 2>&1 | FileCheck --check-prefix=PARSER %s ; RUN: llc -mtriple=amdgcn-amd-amdhsa -mcpu=gfx900 -amdgpu-dump-hsa-metadata -amdgpu-verify-hsa-metadata -filetype=obj -o - < %s 2>&1 | FileCheck --check-prefix=PARSER %s @@ -21,15 +24,16 @@ ; CHECK: Kernels: ; CHECK: - Name: test_char +; CHECK-NEXT: SymbolName: 'test_char@kd' ; CHECK-NEXT: Language: OpenCL C ; CHECK-NEXT: LanguageVersion: [ 2, 0 ] ; CHECK-NEXT: Args: -; CHECK-NEXT: - Size: 1 +; CHECK-NEXT: - TypeName: char +; CHECK-NEXT: Size: 1 ; CHECK-NEXT: Align: 1 ; CHECK-NEXT: ValueKind: ByValue ; CHECK-NEXT: ValueType: I8 ; CHECK-NEXT: AccQual: Default -; CHECK-NEXT: TypeName: char ; CHECK-NEXT: - Size: 8 ; CHECK-NEXT: Align: 8 ; CHECK-NEXT: ValueKind: HiddenGlobalOffsetX @@ -54,15 +58,16 @@ define amdgpu_kernel void @test_char(i8 %a) } ; CHECK: - Name: test_ushort2 +; CHECK-NEXT: SymbolName: 'test_ushort2@kd' ; CHECK-NEXT: Language: OpenCL C ; CHECK-NEXT: LanguageVersion: [ 2, 0 ] ; CHECK-NEXT: Args: -; CHECK-NEXT: - Size: 4 +; CHECK-NEXT: - TypeName: ushort2 +; CHECK-NEXT: Size: 4 ; CHECK-NEXT: Align: 4 ; CHECK-NEXT: ValueKind: ByValue ; CHECK-NEXT: ValueType: U16 ; CHECK-NEXT: AccQual: Default -; CHECK-NEXT: TypeName: ushort2 ; CHECK-NEXT: - Size: 8 ; CHECK-NEXT: Align: 8 ; CHECK-NEXT: ValueKind: HiddenGlobalOffsetX @@ -87,15 +92,16 @@ define amdgpu_kernel void @test_ushort2(<2 x i16> %a) } ; CHECK: - Name: test_int3 +; CHECK-NEXT: SymbolName: 'test_int3@kd' ; CHECK-NEXT: Language: OpenCL C ; CHECK-NEXT: LanguageVersion: [ 2, 0 ] ; CHECK-NEXT: Args: -; CHECK-NEXT: - Size: 16 +; CHECK-NEXT: - TypeName: int3 +; CHECK-NEXT: Size: 16 ; CHECK-NEXT: Align: 16 ; CHECK-NEXT: ValueKind: ByValue ; CHECK-NEXT: ValueType: I32 ; CHECK-NEXT: AccQual: Default -; CHECK-NEXT: TypeName: int3 ; CHECK-NEXT: - Size: 8 ; CHECK-NEXT: Align: 8 ; CHECK-NEXT: ValueKind: HiddenGlobalOffsetX @@ -120,15 +126,16 @@ define amdgpu_kernel void @test_int3(<3 x i32> %a) } ; CHECK: - Name: test_ulong4 +; CHECK-NEXT: SymbolName: 'test_ulong4@kd' ; CHECK-NEXT: Language: OpenCL C ; CHECK-NEXT: LanguageVersion: [ 2, 0 ] ; CHECK-NEXT: Args: -; CHECK-NEXT: - Size: 32 +; CHECK-NEXT: - TypeName: ulong4 +; CHECK-NEXT: Size: 32 ; CHECK-NEXT: Align: 32 ; CHECK-NEXT: ValueKind: ByValue ; CHECK-NEXT: ValueType: U64 ; CHECK-NEXT: AccQual: Default -; CHECK-NEXT: TypeName: ulong4 ; CHECK-NEXT: - Size: 8 ; CHECK-NEXT: Align: 8 ; CHECK-NEXT: ValueKind: HiddenGlobalOffsetX @@ -153,15 +160,16 @@ define amdgpu_kernel void @test_ulong4(<4 x i64> %a) } ; CHECK: - Name: test_half8 +; CHECK-NEXT: SymbolName: 'test_half8@kd' ; CHECK-NEXT: Language: OpenCL C ; CHECK-NEXT: LanguageVersion: [ 2, 0 ] ; CHECK-NEXT: Args: -; CHECK-NEXT: - Size: 16 +; CHECK-NEXT: - TypeName: half8 +; CHECK-NEXT: Size: 16 ; CHECK-NEXT: Align: 16 ; CHECK-NEXT: ValueKind: ByValue ; CHECK-NEXT: ValueType: F16 ; CHECK-NEXT: AccQual: Default -; CHECK-NEXT: TypeName: half8 ; CHECK-NEXT: - Size: 8 ; CHECK-NEXT: Align: 8 ; CHECK-NEXT: ValueKind: HiddenGlobalOffsetX @@ -186,15 +194,16 @@ define amdgpu_kernel void @test_half8(<8 x half> %a) } ; CHECK: - Name: test_float16 +; CHECK-NEXT: SymbolName: 'test_float16@kd' ; CHECK-NEXT: Language: OpenCL C ; CHECK-NEXT: LanguageVersion: [ 2, 0 ] ; CHECK-NEXT: Args: -; CHECK-NEXT: - Size: 64 +; CHECK-NEXT: - TypeName: float16 +; CHECK-NEXT: Size: 64 ; CHECK-NEXT: Align: 64 ; CHECK-NEXT: ValueKind: ByValue ; CHECK-NEXT: ValueType: F32 ; CHECK-NEXT: AccQual: Default -; CHECK-NEXT: TypeName: float16 ; CHECK-NEXT: - Size: 8 ; CHECK-NEXT: Align: 8 ; CHECK-NEXT: ValueKind: HiddenGlobalOffsetX @@ -219,15 +228,16 @@ define amdgpu_kernel void @test_float16(<16 x float> %a) } ; CHECK: - Name: test_double16 +; CHECK-NEXT: SymbolName: 'test_double16@kd' ; CHECK-NEXT: Language: OpenCL C ; CHECK-NEXT: LanguageVersion: [ 2, 0 ] ; CHECK-NEXT: Args: -; CHECK-NEXT: - Size: 128 +; CHECK-NEXT: - TypeName: double16 +; CHECK-NEXT: Size: 128 ; CHECK-NEXT: Align: 128 ; CHECK-NEXT: ValueKind: ByValue ; CHECK-NEXT: ValueType: F64 ; CHECK-NEXT: AccQual: Default -; CHECK-NEXT: TypeName: double16 ; CHECK-NEXT: - Size: 8 ; CHECK-NEXT: Align: 8 ; CHECK-NEXT: ValueKind: HiddenGlobalOffsetX @@ -252,16 +262,17 @@ define amdgpu_kernel void @test_double16(<16 x double> %a) } ; CHECK: - Name: test_pointer +; CHECK-NEXT: SymbolName: 'test_pointer@kd' ; CHECK-NEXT: Language: OpenCL C ; CHECK-NEXT: LanguageVersion: [ 2, 0 ] ; CHECK-NEXT: Args: -; CHECK-NEXT: - Size: 8 +; CHECK-NEXT: - TypeName: 'int *' +; CHECK-NEXT: Size: 8 ; CHECK-NEXT: Align: 8 ; CHECK-NEXT: ValueKind: GlobalBuffer ; CHECK-NEXT: ValueType: I32 -; CHECK-NEXT: AccQual: Default ; CHECK-NEXT: AddrSpaceQual: Global -; CHECK-NEXT: TypeName: 'int *' +; CHECK-NEXT: AccQual: Default ; CHECK-NEXT: - Size: 8 ; CHECK-NEXT: Align: 8 ; CHECK-NEXT: ValueKind: HiddenGlobalOffsetX @@ -286,16 +297,17 @@ define amdgpu_kernel void @test_pointer(i32 addrspace(1)* %a) } ; CHECK: - Name: test_image +; CHECK-NEXT: SymbolName: 'test_image@kd' ; CHECK-NEXT: Language: OpenCL C ; CHECK-NEXT: LanguageVersion: [ 2, 0 ] ; CHECK-NEXT: Args: -; CHECK-NEXT: - Size: 8 +; CHECK-NEXT: - TypeName: image2d_t +; CHECK-NEXT: Size: 8 ; CHECK-NEXT: Align: 8 ; CHECK-NEXT: ValueKind: Image ; CHECK-NEXT: ValueType: Struct -; CHECK-NEXT: AccQual: Default ; CHECK-NEXT: AddrSpaceQual: Global -; CHECK-NEXT: TypeName: image2d_t +; CHECK-NEXT: AccQual: Default ; CHECK-NEXT: - Size: 8 ; CHECK-NEXT: Align: 8 ; CHECK-NEXT: ValueKind: HiddenGlobalOffsetX @@ -320,15 +332,16 @@ define amdgpu_kernel void @test_image(%opencl.image2d_t addrspace(1)* %a) } ; CHECK: - Name: test_sampler +; CHECK-NEXT: SymbolName: 'test_sampler@kd' ; CHECK-NEXT: Language: OpenCL C ; CHECK-NEXT: LanguageVersion: [ 2, 0 ] ; CHECK-NEXT: Args: -; CHECK-NEXT: - Size: 4 +; CHECK-NEXT: - TypeName: sampler_t +; CHECK-NEXT: Size: 4 ; CHECK-NEXT: Align: 4 ; CHECK-NEXT: ValueKind: Sampler ; CHECK-NEXT: ValueType: I32 ; CHECK-NEXT: AccQual: Default -; CHECK-NEXT: TypeName: sampler_t ; CHECK-NEXT: - Size: 8 ; CHECK-NEXT: Align: 8 ; CHECK-NEXT: ValueKind: HiddenGlobalOffsetX @@ -353,16 +366,17 @@ define amdgpu_kernel void @test_sampler(i32 %a) } ; CHECK: - Name: test_queue +; CHECK-NEXT: SymbolName: 'test_queue@kd' ; CHECK-NEXT: Language: OpenCL C ; CHECK-NEXT: LanguageVersion: [ 2, 0 ] ; CHECK-NEXT: Args: -; CHECK-NEXT: - Size: 8 +; CHECK-NEXT: - TypeName: queue_t +; CHECK-NEXT: Size: 8 ; CHECK-NEXT: Align: 8 ; CHECK-NEXT: ValueKind: Queue ; CHECK-NEXT: ValueType: Struct -; CHECK-NEXT: AccQual: Default ; CHECK-NEXT: AddrSpaceQual: Global -; CHECK-NEXT: TypeName: queue_t +; CHECK-NEXT: AccQual: Default ; CHECK-NEXT: - Size: 8 ; CHECK-NEXT: Align: 8 ; CHECK-NEXT: ValueKind: HiddenGlobalOffsetX @@ -387,16 +401,17 @@ define amdgpu_kernel void @test_queue(%opencl.queue_t addrspace(1)* %a) } ; CHECK: - Name: test_struct +; CHECK-NEXT: SymbolName: 'test_struct@kd' ; CHECK-NEXT: Language: OpenCL C ; CHECK-NEXT: LanguageVersion: [ 2, 0 ] ; CHECK-NEXT: Args: -; CHECK-NEXT: - Size: 4 +; CHECK-NEXT: - TypeName: struct A +; CHECK-NEXT: Size: 4 ; CHECK-NEXT: Align: 4 ; CHECK-NEXT: ValueKind: GlobalBuffer ; CHECK-NEXT: ValueType: Struct -; CHECK-NEXT: AccQual: Default ; CHECK-NEXT: AddrSpaceQual: Private -; CHECK-NEXT: TypeName: struct A +; CHECK-NEXT: AccQual: Default ; CHECK-NEXT: - Size: 8 ; CHECK-NEXT: Align: 8 ; CHECK-NEXT: ValueKind: HiddenGlobalOffsetX @@ -421,15 +436,16 @@ define amdgpu_kernel void @test_struct(%struct.A* byval %a) } ; CHECK: - Name: test_i128 +; CHECK-NEXT: SymbolName: 'test_i128@kd' ; CHECK-NEXT: Language: OpenCL C ; CHECK-NEXT: LanguageVersion: [ 2, 0 ] ; CHECK-NEXT: Args: -; CHECK-NEXT: - Size: 16 +; CHECK-NEXT: - TypeName: i128 +; CHECK-NEXT: Size: 16 ; CHECK-NEXT: Align: 8 ; CHECK-NEXT: ValueKind: ByValue ; CHECK-NEXT: ValueType: Struct ; CHECK-NEXT: AccQual: Default -; CHECK-NEXT: TypeName: i128 ; CHECK-NEXT: - Size: 8 ; CHECK-NEXT: Align: 8 ; CHECK-NEXT: ValueKind: HiddenGlobalOffsetX @@ -454,27 +470,28 @@ define amdgpu_kernel void @test_i128(i128 %a) } ; CHECK: - Name: test_multi_arg +; CHECK-NEXT: SymbolName: 'test_multi_arg@kd' ; CHECK-NEXT: Language: OpenCL C ; CHECK-NEXT: LanguageVersion: [ 2, 0 ] ; CHECK-NEXT: Args: -; CHECK-NEXT: - Size: 4 +; CHECK-NEXT: - TypeName: int +; CHECK-NEXT: Size: 4 ; CHECK-NEXT: Align: 4 ; CHECK-NEXT: ValueKind: ByValue ; CHECK-NEXT: ValueType: I32 ; CHECK-NEXT: AccQual: Default -; CHECK-NEXT: TypeName: int -; CHECK-NEXT: - Size: 4 +; CHECK-NEXT: - TypeName: short2 +; CHECK-NEXT: Size: 4 ; CHECK-NEXT: Align: 4 ; CHECK-NEXT: ValueKind: ByValue ; CHECK-NEXT: ValueType: I16 ; CHECK-NEXT: AccQual: Default -; CHECK-NEXT: TypeName: short2 -; CHECK-NEXT: - Size: 4 +; CHECK-NEXT: - TypeName: char3 +; CHECK-NEXT: Size: 4 ; CHECK-NEXT: Align: 4 ; CHECK-NEXT: ValueKind: ByValue ; CHECK-NEXT: ValueType: I8 ; CHECK-NEXT: AccQual: Default -; CHECK-NEXT: TypeName: char3 ; CHECK-NEXT: - Size: 8 ; CHECK-NEXT: Align: 8 ; CHECK-NEXT: ValueKind: HiddenGlobalOffsetX @@ -499,31 +516,32 @@ define amdgpu_kernel void @test_multi_arg(i32 %a, <2 x i16> %b, <3 x i8> %c) } ; CHECK: - Name: test_addr_space +; CHECK-NEXT: SymbolName: 'test_addr_space@kd' ; CHECK-NEXT: Language: OpenCL C ; CHECK-NEXT: LanguageVersion: [ 2, 0 ] ; CHECK-NEXT: Args: -; CHECK-NEXT: - Size: 8 +; CHECK-NEXT: - TypeName: 'int *' +; CHECK-NEXT: Size: 8 ; CHECK-NEXT: Align: 8 ; CHECK-NEXT: ValueKind: GlobalBuffer ; CHECK-NEXT: ValueType: I32 -; CHECK-NEXT: AccQual: Default ; CHECK-NEXT: AddrSpaceQual: Global -; CHECK-NEXT: TypeName: 'int *' -; CHECK-NEXT: - Size: 8 +; CHECK-NEXT: AccQual: Default +; CHECK-NEXT: - TypeName: 'int *' +; CHECK-NEXT: Size: 8 ; CHECK-NEXT: Align: 8 ; CHECK-NEXT: ValueKind: GlobalBuffer ; CHECK-NEXT: ValueType: I32 -; CHECK-NEXT: AccQual: Default ; CHECK-NEXT: AddrSpaceQual: Constant -; CHECK-NEXT: TypeName: 'int *' -; CHECK-NEXT: - Size: 4 +; CHECK-NEXT: AccQual: Default +; CHECK-NEXT: - TypeName: 'int *' +; CHECK-NEXT: Size: 4 ; CHECK-NEXT: Align: 4 ; CHECK-NEXT: ValueKind: DynamicSharedPointer ; CHECK-NEXT: ValueType: I32 ; CHECK-NEXT: PointeeAlign: 4 -; CHECK-NEXT: AccQual: Default ; CHECK-NEXT: AddrSpaceQual: Local -; CHECK-NEXT: TypeName: 'int *' +; CHECK-NEXT: AccQual: Default ; CHECK-NEXT: - Size: 8 ; CHECK-NEXT: Align: 8 ; CHECK-NEXT: ValueKind: HiddenGlobalOffsetX @@ -550,34 +568,35 @@ define amdgpu_kernel void @test_addr_space(i32 addrspace(1)* %g, } ; CHECK: - Name: test_type_qual +; CHECK-NEXT: SymbolName: 'test_type_qual@kd' ; CHECK-NEXT: Language: OpenCL C ; CHECK-NEXT: LanguageVersion: [ 2, 0 ] ; CHECK-NEXT: Args: -; CHECK-NEXT: - Size: 8 +; CHECK-NEXT: - TypeName: 'int *' +; CHECK-NEXT: Size: 8 ; CHECK-NEXT: Align: 8 ; CHECK-NEXT: ValueKind: GlobalBuffer ; CHECK-NEXT: ValueType: I32 -; CHECK-NEXT: AccQual: Default ; CHECK-NEXT: AddrSpaceQual: Global +; CHECK-NEXT: AccQual: Default ; CHECK-NEXT: IsVolatile: true -; CHECK-NEXT: TypeName: 'int *' -; CHECK-NEXT: - Size: 8 +; CHECK-NEXT: - TypeName: 'int *' +; CHECK-NEXT: Size: 8 ; CHECK-NEXT: Align: 8 ; CHECK-NEXT: ValueKind: GlobalBuffer ; CHECK-NEXT: ValueType: I32 -; CHECK-NEXT: AccQual: Default ; CHECK-NEXT: AddrSpaceQual: Global +; CHECK-NEXT: AccQual: Default ; CHECK-NEXT: IsConst: true ; CHECK-NEXT: IsRestrict: true -; CHECK-NEXT: TypeName: 'int *' -; CHECK-NEXT: - Size: 8 +; CHECK-NEXT: - TypeName: 'int *' +; CHECK-NEXT: Size: 8 ; CHECK-NEXT: Align: 8 ; CHECK-NEXT: ValueKind: Pipe ; CHECK-NEXT: ValueType: Struct -; CHECK-NEXT: AccQual: Default ; CHECK-NEXT: AddrSpaceQual: Global +; CHECK-NEXT: AccQual: Default ; CHECK-NEXT: IsPipe: true -; CHECK-NEXT: TypeName: 'int *' ; CHECK-NEXT: - Size: 8 ; CHECK-NEXT: Align: 8 ; CHECK-NEXT: ValueKind: HiddenGlobalOffsetX @@ -604,30 +623,31 @@ define amdgpu_kernel void @test_type_qual(i32 addrspace(1)* %a, } ; CHECK: - Name: test_access_qual +; CHECK-NEXT: SymbolName: 'test_access_qual@kd' ; CHECK-NEXT: Language: OpenCL C ; CHECK-NEXT: LanguageVersion: [ 2, 0 ] ; CHECK-NEXT: Args: -; CHECK-NEXT: - Size: 8 +; CHECK-NEXT: - TypeName: image1d_t +; CHECK-NEXT: Size: 8 ; CHECK-NEXT: Align: 8 ; CHECK-NEXT: ValueKind: Image ; CHECK-NEXT: ValueType: Struct -; CHECK-NEXT: AccQual: ReadOnly ; CHECK-NEXT: AddrSpaceQual: Global -; CHECK-NEXT: TypeName: image1d_t -; CHECK-NEXT: - Size: 8 +; CHECK-NEXT: AccQual: ReadOnly +; CHECK-NEXT: - TypeName: image2d_t +; CHECK-NEXT: Size: 8 ; CHECK-NEXT: Align: 8 ; CHECK-NEXT: ValueKind: Image ; CHECK-NEXT: ValueType: Struct -; CHECK-NEXT: AccQual: WriteOnly ; CHECK-NEXT: AddrSpaceQual: Global -; CHECK-NEXT: TypeName: image2d_t -; CHECK-NEXT: - Size: 8 +; CHECK-NEXT: AccQual: WriteOnly +; CHECK-NEXT: - TypeName: image3d_t +; CHECK-NEXT: Size: 8 ; CHECK-NEXT: Align: 8 ; CHECK-NEXT: ValueKind: Image ; CHECK-NEXT: ValueType: Struct -; CHECK-NEXT: AccQual: ReadWrite ; CHECK-NEXT: AddrSpaceQual: Global -; CHECK-NEXT: TypeName: image3d_t +; CHECK-NEXT: AccQual: ReadWrite ; CHECK-NEXT: - Size: 8 ; CHECK-NEXT: Align: 8 ; CHECK-NEXT: ValueKind: HiddenGlobalOffsetX @@ -654,17 +674,18 @@ define amdgpu_kernel void @test_access_qual(%opencl.image1d_t addrspace(1)* %ro, } ; CHECK: - Name: test_vec_type_hint_half +; CHECK-NEXT: SymbolName: 'test_vec_type_hint_half@kd' ; CHECK-NEXT: Language: OpenCL C ; CHECK-NEXT: LanguageVersion: [ 2, 0 ] ; CHECK-NEXT: Attrs: ; CHECK-NEXT: VecTypeHint: half ; CHECK-NEXT: Args: -; CHECK-NEXT: - Size: 4 +; CHECK-NEXT: - TypeName: int +; CHECK-NEXT: Size: 4 ; CHECK-NEXT: Align: 4 ; CHECK-NEXT: ValueKind: ByValue ; CHECK-NEXT: ValueType: I32 ; CHECK-NEXT: AccQual: Default -; CHECK-NEXT: TypeName: int ; CHECK-NEXT: - Size: 8 ; CHECK-NEXT: Align: 8 ; CHECK-NEXT: ValueKind: HiddenGlobalOffsetX @@ -689,17 +710,18 @@ define amdgpu_kernel void @test_vec_type_hint_half(i32 %a) } ; CHECK: - Name: test_vec_type_hint_float +; CHECK-NEXT: SymbolName: 'test_vec_type_hint_float@kd' ; CHECK-NEXT: Language: OpenCL C ; CHECK-NEXT: LanguageVersion: [ 2, 0 ] ; CHECK-NEXT: Attrs: ; CHECK-NEXT: VecTypeHint: float ; CHECK-NEXT: Args: -; CHECK-NEXT: - Size: 4 +; CHECK-NEXT: - TypeName: int +; CHECK-NEXT: Size: 4 ; CHECK-NEXT: Align: 4 ; CHECK-NEXT: ValueKind: ByValue ; CHECK-NEXT: ValueType: I32 ; CHECK-NEXT: AccQual: Default -; CHECK-NEXT: TypeName: int ; CHECK-NEXT: - Size: 8 ; CHECK-NEXT: Align: 8 ; CHECK-NEXT: ValueKind: HiddenGlobalOffsetX @@ -724,17 +746,18 @@ define amdgpu_kernel void @test_vec_type_hint_float(i32 %a) } ; CHECK: - Name: test_vec_type_hint_double +; CHECK-NEXT: SymbolName: 'test_vec_type_hint_double@kd' ; CHECK-NEXT: Language: OpenCL C ; CHECK-NEXT: LanguageVersion: [ 2, 0 ] ; CHECK-NEXT: Attrs: ; CHECK-NEXT: VecTypeHint: double ; CHECK-NEXT: Args: -; CHECK-NEXT: - Size: 4 +; CHECK-NEXT: - TypeName: int +; CHECK-NEXT: Size: 4 ; CHECK-NEXT: Align: 4 ; CHECK-NEXT: ValueKind: ByValue ; CHECK-NEXT: ValueType: I32 ; CHECK-NEXT: AccQual: Default -; CHECK-NEXT: TypeName: int ; CHECK-NEXT: - Size: 8 ; CHECK-NEXT: Align: 8 ; CHECK-NEXT: ValueKind: HiddenGlobalOffsetX @@ -759,17 +782,18 @@ define amdgpu_kernel void @test_vec_type_hint_double(i32 %a) } ; CHECK: - Name: test_vec_type_hint_char +; CHECK-NEXT: SymbolName: 'test_vec_type_hint_char@kd' ; CHECK-NEXT: Language: OpenCL C ; CHECK-NEXT: LanguageVersion: [ 2, 0 ] ; CHECK-NEXT: Attrs: ; CHECK-NEXT: VecTypeHint: char ; CHECK-NEXT: Args: -; CHECK-NEXT: - Size: 4 +; CHECK-NEXT: - TypeName: int +; CHECK-NEXT: Size: 4 ; CHECK-NEXT: Align: 4 ; CHECK-NEXT: ValueKind: ByValue ; CHECK-NEXT: ValueType: I32 ; CHECK-NEXT: AccQual: Default -; CHECK-NEXT: TypeName: int ; CHECK-NEXT: - Size: 8 ; CHECK-NEXT: Align: 8 ; CHECK-NEXT: ValueKind: HiddenGlobalOffsetX @@ -794,17 +818,18 @@ define amdgpu_kernel void @test_vec_type_hint_char(i32 %a) } ; CHECK: - Name: test_vec_type_hint_short +; CHECK-NEXT: SymbolName: 'test_vec_type_hint_short@kd' ; CHECK-NEXT: Language: OpenCL C ; CHECK-NEXT: LanguageVersion: [ 2, 0 ] ; CHECK-NEXT: Attrs: ; CHECK-NEXT: VecTypeHint: short ; CHECK-NEXT: Args: -; CHECK-NEXT: - Size: 4 +; CHECK-NEXT: - TypeName: int +; CHECK-NEXT: Size: 4 ; CHECK-NEXT: Align: 4 ; CHECK-NEXT: ValueKind: ByValue ; CHECK-NEXT: ValueType: I32 ; CHECK-NEXT: AccQual: Default -; CHECK-NEXT: TypeName: int ; CHECK-NEXT: - Size: 8 ; CHECK-NEXT: Align: 8 ; CHECK-NEXT: ValueKind: HiddenGlobalOffsetX @@ -829,17 +854,18 @@ define amdgpu_kernel void @test_vec_type_hint_short(i32 %a) } ; CHECK: - Name: test_vec_type_hint_long +; CHECK-NEXT: SymbolName: 'test_vec_type_hint_long@kd' ; CHECK-NEXT: Language: OpenCL C ; CHECK-NEXT: LanguageVersion: [ 2, 0 ] ; CHECK-NEXT: Attrs: ; CHECK-NEXT: VecTypeHint: long ; CHECK-NEXT: Args: -; CHECK-NEXT: - Size: 4 +; CHECK-NEXT: - TypeName: int +; CHECK-NEXT: Size: 4 ; CHECK-NEXT: Align: 4 ; CHECK-NEXT: ValueKind: ByValue ; CHECK-NEXT: ValueType: I32 ; CHECK-NEXT: AccQual: Default -; CHECK-NEXT: TypeName: int ; CHECK-NEXT: - Size: 8 ; CHECK-NEXT: Align: 8 ; CHECK-NEXT: ValueKind: HiddenGlobalOffsetX @@ -864,17 +890,18 @@ define amdgpu_kernel void @test_vec_type_hint_long(i32 %a) } ; CHECK: - Name: test_vec_type_hint_unknown +; CHECK-NEXT: SymbolName: 'test_vec_type_hint_unknown@kd' ; CHECK-NEXT: Language: OpenCL C ; CHECK-NEXT: LanguageVersion: [ 2, 0 ] ; CHECK-NEXT: Attrs: ; CHECK-NEXT: VecTypeHint: unknown ; CHECK-NEXT: Args: -; CHECK-NEXT: - Size: 4 +; CHECK-NEXT: - TypeName: int +; CHECK-NEXT: Size: 4 ; CHECK-NEXT: Align: 4 ; CHECK-NEXT: ValueKind: ByValue ; CHECK-NEXT: ValueType: I32 ; CHECK-NEXT: AccQual: Default -; CHECK-NEXT: TypeName: int ; CHECK-NEXT: - Size: 8 ; CHECK-NEXT: Align: 8 ; CHECK-NEXT: ValueKind: HiddenGlobalOffsetX @@ -899,18 +926,19 @@ define amdgpu_kernel void @test_vec_type_hint_unknown(i32 %a) } ; CHECK: - Name: test_reqd_wgs_vec_type_hint +; CHECK-NEXT: SymbolName: 'test_reqd_wgs_vec_type_hint@kd' ; CHECK-NEXT: Language: OpenCL C ; CHECK-NEXT: LanguageVersion: [ 2, 0 ] ; CHECK-NEXT: Attrs: ; CHECK-NEXT: ReqdWorkGroupSize: [ 1, 2, 4 ] ; CHECK-NEXT: VecTypeHint: int ; CHECK-NEXT: Args: -; CHECK-NEXT: - Size: 4 +; CHECK-NEXT: - TypeName: int +; CHECK-NEXT: Size: 4 ; CHECK-NEXT: Align: 4 ; CHECK-NEXT: ValueKind: ByValue ; CHECK-NEXT: ValueType: I32 ; CHECK-NEXT: AccQual: Default -; CHECK-NEXT: TypeName: int ; CHECK-NEXT: - Size: 8 ; CHECK-NEXT: Align: 8 ; CHECK-NEXT: ValueKind: HiddenGlobalOffsetX @@ -936,18 +964,19 @@ define amdgpu_kernel void @test_reqd_wgs_vec_type_hint(i32 %a) } ; CHECK: - Name: test_wgs_hint_vec_type_hint +; CHECK-NEXT: SymbolName: 'test_wgs_hint_vec_type_hint@kd' ; CHECK-NEXT: Language: OpenCL C ; CHECK-NEXT: LanguageVersion: [ 2, 0 ] ; CHECK-NEXT: Attrs: ; CHECK-NEXT: WorkGroupSizeHint: [ 8, 16, 32 ] ; CHECK-NEXT: VecTypeHint: uint4 ; CHECK-NEXT: Args: -; CHECK-NEXT: - Size: 4 +; CHECK-NEXT: - TypeName: int +; CHECK-NEXT: Size: 4 ; CHECK-NEXT: Align: 4 ; CHECK-NEXT: ValueKind: ByValue ; CHECK-NEXT: ValueType: I32 ; CHECK-NEXT: AccQual: Default -; CHECK-NEXT: TypeName: int ; CHECK-NEXT: - Size: 8 ; CHECK-NEXT: Align: 8 ; CHECK-NEXT: ValueKind: HiddenGlobalOffsetX @@ -973,16 +1002,17 @@ define amdgpu_kernel void @test_wgs_hint_vec_type_hint(i32 %a) } ; CHECK: - Name: test_arg_ptr_to_ptr +; CHECK-NEXT: SymbolName: 'test_arg_ptr_to_ptr@kd' ; CHECK-NEXT: Language: OpenCL C ; CHECK-NEXT: LanguageVersion: [ 2, 0 ] ; CHECK-NEXT: Args: -; CHECK-NEXT: - Size: 8 +; CHECK-NEXT: - TypeName: 'int **' +; CHECK-NEXT: Size: 8 ; CHECK-NEXT: Align: 8 ; CHECK-NEXT: ValueKind: GlobalBuffer ; CHECK-NEXT: ValueType: I32 -; CHECK-NEXT: AccQual: Default ; CHECK-NEXT: AddrSpaceQual: Global -; CHECK-NEXT: TypeName: 'int **' +; CHECK-NEXT: AccQual: Default ; CHECK-NEXT: - Size: 8 ; CHECK-NEXT: Align: 8 ; CHECK-NEXT: ValueKind: HiddenGlobalOffsetX @@ -1007,16 +1037,17 @@ define amdgpu_kernel void @test_arg_ptr_to_ptr(i32* addrspace(1)* %a) } ; CHECK: - Name: test_arg_struct_contains_ptr +; CHECK-NEXT: SymbolName: 'test_arg_struct_contains_ptr@kd' ; CHECK-NEXT: Language: OpenCL C ; CHECK-NEXT: LanguageVersion: [ 2, 0 ] ; CHECK-NEXT: Args: -; CHECK-NEXT: - Size: 4 +; CHECK-NEXT: - TypeName: struct B +; CHECK-NEXT: Size: 4 ; CHECK-NEXT: Align: 4 ; CHECK-NEXT: ValueKind: GlobalBuffer ; CHECK-NEXT: ValueType: Struct -; CHECK-NEXT: AccQual: Default ; CHECK-NEXT: AddrSpaceQual: Private -; CHECK-NEXT: TypeName: struct B +; CHECK-NEXT: AccQual: Default ; CHECK-NEXT: - Size: 8 ; CHECK-NEXT: Align: 8 ; CHECK-NEXT: ValueKind: HiddenGlobalOffsetX @@ -1041,15 +1072,16 @@ define amdgpu_kernel void @test_arg_struct_contains_ptr(%struct.B* byval %a) } ; CHECK: - Name: test_arg_vector_of_ptr +; CHECK-NEXT: SymbolName: 'test_arg_vector_of_ptr@kd' ; CHECK-NEXT: Language: OpenCL C ; CHECK-NEXT: LanguageVersion: [ 2, 0 ] ; CHECK-NEXT: Args: -; CHECK-NEXT: - Size: 16 +; CHECK-NEXT: - TypeName: 'global int* __attribute__((ext_vector_type(2)))' +; CHECK-NEXT: Size: 16 ; CHECK-NEXT: Align: 16 ; CHECK-NEXT: ValueKind: ByValue ; CHECK-NEXT: ValueType: I32 ; CHECK-NEXT: AccQual: Default -; CHECK-NEXT: TypeName: 'global int* __attribute__((ext_vector_type(2)))' ; CHECK-NEXT: - Size: 8 ; CHECK-NEXT: Align: 8 ; CHECK-NEXT: ValueKind: HiddenGlobalOffsetX @@ -1074,16 +1106,17 @@ define amdgpu_kernel void @test_arg_vector_of_ptr(<2 x i32 addrspace(1)*> %a) } ; CHECK: - Name: test_arg_unknown_builtin_type +; CHECK-NEXT: SymbolName: 'test_arg_unknown_builtin_type@kd' ; CHECK-NEXT: Language: OpenCL C ; CHECK-NEXT: LanguageVersion: [ 2, 0 ] ; CHECK-NEXT: Args: -; CHECK-NEXT: - Size: 8 +; CHECK-NEXT: - TypeName: clk_event_t +; CHECK-NEXT: Size: 8 ; CHECK-NEXT: Align: 8 ; CHECK-NEXT: ValueKind: GlobalBuffer ; CHECK-NEXT: ValueType: Struct -; CHECK-NEXT: AccQual: Default ; CHECK-NEXT: AddrSpaceQual: Global -; CHECK-NEXT: TypeName: clk_event_t +; CHECK-NEXT: AccQual: Default ; CHECK-NEXT: - Size: 8 ; CHECK-NEXT: Align: 8 ; CHECK-NEXT: ValueKind: HiddenGlobalOffsetX @@ -1109,64 +1142,65 @@ define amdgpu_kernel void @test_arg_unknown_builtin_type( } ; CHECK: - Name: test_pointee_align +; CHECK-NEXT: SymbolName: 'test_pointee_align@kd' ; CHECK-NEXT: Language: OpenCL C ; CHECK-NEXT: LanguageVersion: [ 2, 0 ] ; CHECK-NEXT: Args: -; CHECK-NEXT: - Size: 8 +; CHECK-NEXT: - TypeName: 'long *' +; CHECK-NEXT: Size: 8 ; CHECK-NEXT: Align: 8 ; CHECK-NEXT: ValueKind: GlobalBuffer ; CHECK-NEXT: ValueType: I64 -; CHECK-NEXT: AccQual: Default ; CHECK-NEXT: AddrSpaceQual: Global -; CHECK-NEXT: TypeName: 'long *' -; CHECK-NEXT: - Size: 4 +; CHECK-NEXT: AccQual: Default +; CHECK-NEXT: - TypeName: 'char *' +; CHECK-NEXT: Size: 4 ; CHECK-NEXT: Align: 4 ; CHECK-NEXT: ValueKind: DynamicSharedPointer ; CHECK-NEXT: ValueType: I8 ; CHECK-NEXT: PointeeAlign: 1 -; CHECK-NEXT: AccQual: Default ; CHECK-NEXT: AddrSpaceQual: Local -; CHECK-NEXT: TypeName: 'char *' -; CHECK-NEXT: - Size: 4 +; CHECK-NEXT: AccQual: Default +; CHECK-NEXT: - TypeName: 'char2 *' +; CHECK-NEXT: Size: 4 ; CHECK-NEXT: Align: 4 ; CHECK-NEXT: ValueKind: DynamicSharedPointer ; CHECK-NEXT: ValueType: I8 ; CHECK-NEXT: PointeeAlign: 2 -; CHECK-NEXT: AccQual: Default ; CHECK-NEXT: AddrSpaceQual: Local -; CHECK-NEXT: TypeName: 'char2 *' -; CHECK-NEXT: - Size: 4 +; CHECK-NEXT: AccQual: Default +; CHECK-NEXT: - TypeName: 'char3 *' +; CHECK-NEXT: Size: 4 ; CHECK-NEXT: Align: 4 ; CHECK-NEXT: ValueKind: DynamicSharedPointer ; CHECK-NEXT: ValueType: I8 ; CHECK-NEXT: PointeeAlign: 4 -; CHECK-NEXT: AccQual: Default ; CHECK-NEXT: AddrSpaceQual: Local -; CHECK-NEXT: TypeName: 'char3 *' -; CHECK-NEXT: - Size: 4 +; CHECK-NEXT: AccQual: Default +; CHECK-NEXT: - TypeName: 'char4 *' +; CHECK-NEXT: Size: 4 ; CHECK-NEXT: Align: 4 ; CHECK-NEXT: ValueKind: DynamicSharedPointer ; CHECK-NEXT: ValueType: I8 ; CHECK-NEXT: PointeeAlign: 4 -; CHECK-NEXT: AccQual: Default ; CHECK-NEXT: AddrSpaceQual: Local -; CHECK-NEXT: TypeName: 'char4 *' -; CHECK-NEXT: - Size: 4 +; CHECK-NEXT: AccQual: Default +; CHECK-NEXT: - TypeName: 'char8 *' +; CHECK-NEXT: Size: 4 ; CHECK-NEXT: Align: 4 ; CHECK-NEXT: ValueKind: DynamicSharedPointer ; CHECK-NEXT: ValueType: I8 ; CHECK-NEXT: PointeeAlign: 8 -; CHECK-NEXT: AccQual: Default ; CHECK-NEXT: AddrSpaceQual: Local -; CHECK-NEXT: TypeName: 'char8 *' -; CHECK-NEXT: - Size: 4 +; CHECK-NEXT: AccQual: Default +; CHECK-NEXT: - TypeName: 'char16 *' +; CHECK-NEXT: Size: 4 ; CHECK-NEXT: Align: 4 ; CHECK-NEXT: ValueKind: DynamicSharedPointer ; CHECK-NEXT: ValueType: I8 ; CHECK-NEXT: PointeeAlign: 16 -; CHECK-NEXT: AccQual: Default ; CHECK-NEXT: AddrSpaceQual: Local -; CHECK-NEXT: TypeName: 'char16 *' +; CHECK-NEXT: AccQual: Default ; CHECK-NEXT: - Size: 8 ; CHECK-NEXT: Align: 8 ; CHECK-NEXT: ValueKind: HiddenGlobalOffsetX @@ -1197,17 +1231,18 @@ define amdgpu_kernel void @test_pointee_align(i64 addrspace(1)* %a, } ; CHECK: - Name: __test_block_invoke_kernel +; CHECK-NEXT: SymbolName: '__test_block_invoke_kernel@kd' ; CHECK-NEXT: Language: OpenCL C ; CHECK-NEXT: LanguageVersion: [ 2, 0 ] ; CHECK-NEXT: Attrs: ; CHECK-NEXT: RuntimeHandle: __test_block_invoke_kernel_runtime_handle ; CHECK-NEXT: Args: -; CHECK-NEXT: - Size: 25 +; CHECK-NEXT: - TypeName: __block_literal +; CHECK-NEXT: Size: 25 ; CHECK-NEXT: Align: 1 ; CHECK-NEXT: ValueKind: ByValue ; CHECK-NEXT: ValueType: Struct ; CHECK-NEXT: AccQual: Default -; CHECK-NEXT: TypeName: __block_literal ; CHECK-NEXT: - Size: 8 ; CHECK-NEXT: Align: 8 ; CHECK-NEXT: ValueKind: HiddenGlobalOffsetX diff --git a/test/CodeGen/AMDGPU/hsa-metadata-images.ll b/test/CodeGen/AMDGPU/hsa-metadata-images.ll index a29f86d0170..286f57399b7 100644 --- a/test/CodeGen/AMDGPU/hsa-metadata-images.ll +++ b/test/CodeGen/AMDGPU/hsa-metadata-images.ll @@ -19,44 +19,45 @@ ; CHECK: Version: [ 1, 0 ] ; CHECK: Kernels: -; CHECK: - Name: test +; CHECK: - Name: test +; CHECK: SymbolName: 'test@kd' ; CHECK: Args: -; CHECK: - Size: 8 +; CHECK: - TypeName: image1d_t +; CHECK: Size: 8 ; CHECK: ValueKind: Image -; CHECK: TypeName: image1d_t -; CHECK: - Size: 8 +; CHECK: - TypeName: image1d_array_t +; CHECK: Size: 8 ; CHECK: ValueKind: Image -; CHECK: TypeName: image1d_array_t -; CHECK: - Size: 8 +; CHECK: - TypeName: image1d_buffer_t +; CHECK: Size: 8 ; CHECK: ValueKind: Image -; CHECK: TypeName: image1d_buffer_t -; CHECK: - Size: 8 +; CHECK: - TypeName: image2d_t +; CHECK: Size: 8 ; CHECK: ValueKind: Image -; CHECK: TypeName: image2d_t -; CHECK: - Size: 8 +; CHECK: - TypeName: image2d_array_t +; CHECK: Size: 8 ; CHECK: ValueKind: Image -; CHECK: TypeName: image2d_array_t -; CHECK: - Size: 8 +; CHECK: - TypeName: image2d_array_depth_t +; CHECK: Size: 8 ; CHECK: ValueKind: Image -; CHECK: TypeName: image2d_array_depth_t -; CHECK: - Size: 8 +; CHECK: - TypeName: image2d_array_msaa_t +; CHECK: Size: 8 ; CHECK: ValueKind: Image -; CHECK: TypeName: image2d_array_msaa_t -; CHECK: - Size: 8 +; CHECK: - TypeName: image2d_array_msaa_depth_t +; CHECK: Size: 8 ; CHECK: ValueKind: Image -; CHECK: TypeName: image2d_array_msaa_depth_t -; CHECK: - Size: 8 +; CHECK: - TypeName: image2d_depth_t +; CHECK: Size: 8 ; CHECK: ValueKind: Image -; CHECK: TypeName: image2d_depth_t -; CHECK: - Size: 8 +; CHECK: - TypeName: image2d_msaa_t +; CHECK: Size: 8 ; CHECK: ValueKind: Image -; CHECK: TypeName: image2d_msaa_t -; CHECK: - Size: 8 +; CHECK: - TypeName: image2d_msaa_depth_t +; CHECK: Size: 8 ; CHECK: ValueKind: Image -; CHECK: TypeName: image2d_msaa_depth_t -; CHECK: - Size: 8 +; CHECK: - TypeName: image3d_t +; CHECK: Size: 8 ; CHECK: ValueKind: Image -; CHECK: TypeName: image3d_t define amdgpu_kernel void @test(%opencl.image1d_t addrspace(1)* %a, %opencl.image1d_array_t addrspace(1)* %b, %opencl.image1d_buffer_t addrspace(1)* %c, diff --git a/test/CodeGen/AMDGPU/hsa-metadata-kernel-code-props.ll b/test/CodeGen/AMDGPU/hsa-metadata-kernel-code-props.ll index c10c69a92c7..ae839bb079a 100644 --- a/test/CodeGen/AMDGPU/hsa-metadata-kernel-code-props.ll +++ b/test/CodeGen/AMDGPU/hsa-metadata-kernel-code-props.ll @@ -6,19 +6,20 @@ ; CHECK: Version: [ 1, 0 ] ; CHECK: Kernels: -; CHECK: - Name: test +; CHECK: - Name: test +; CHECK: SymbolName: 'test@kd' ; CHECK: CodeProps: ; CHECK: KernargSegmentSize: 24 -; GFX700: WavefrontNumSGPRs: 6 -; GFX800: WavefrontNumSGPRs: 96 -; GFX900: WavefrontNumSGPRs: 6 -; GFX700: WorkitemNumVGPRs: 4 -; GFX800: WorkitemNumVGPRs: 6 -; GFX900: WorkitemNumVGPRs: 6 -; CHECK: KernargSegmentAlign: 4 -; CHECK: GroupSegmentAlign: 4 -; CHECK: PrivateSegmentAlign: 4 -; CHECK: WavefrontSize: 6 +; CHECK: GroupSegmentFixedSize: 0 +; CHECK: PrivateSegmentFixedSize: 0 +; CHECK: KernargSegmentAlign: 8 +; CHECK: WavefrontSize: 64 +; GFX700: NumSGPRs: 6 +; GFX800: NumSGPRs: 96 +; GFX900: NumSGPRs: 6 +; GFX700: NumVGPRs: 4 +; GFX800: NumVGPRs: 6 +; GFX900: NumVGPRs: 6 define amdgpu_kernel void @test( half addrspace(1)* %r, half addrspace(1)* %a, diff --git a/test/CodeGen/AMDGPU/hsa-metadata-kernel-debug-props.ll b/test/CodeGen/AMDGPU/hsa-metadata-kernel-debug-props.ll index a8639453485..f9b94d19143 100644 --- a/test/CodeGen/AMDGPU/hsa-metadata-kernel-debug-props.ll +++ b/test/CodeGen/AMDGPU/hsa-metadata-kernel-debug-props.ll @@ -8,7 +8,8 @@ declare void @llvm.dbg.declare(metadata, metadata, metadata) ; CHECK: Version: [ 1, 0 ] ; CHECK: Kernels: -; CHECK: - Name: test +; CHECK: - Name: test +; CHECK: SymbolName: 'test@kd' ; CHECK: DebugProps: ; CHECK: DebuggerABIVersion: [ 1, 0 ] ; CHECK: ReservedNumVGPRs: 4 diff --git a/test/MC/AMDGPU/hsa-metadata-kernel-args.s b/test/MC/AMDGPU/hsa-metadata-kernel-args.s index 3416fff2814..2f9960ffaa0 100644 --- a/test/MC/AMDGPU/hsa-metadata-kernel-args.s +++ b/test/MC/AMDGPU/hsa-metadata-kernel-args.s @@ -9,15 +9,16 @@ // CHECK: - '2:1:8:%g\n' // CHECK: Kernels: // CHECK: - Name: test_kernel +// CHECK: SymbolName: 'test_kernel@kd' // CHECK: Language: OpenCL C // CHECK: LanguageVersion: [ 2, 0 ] // CHECK: Args: -// CHECK: - Size: 1 +// CHECK: - TypeName: char +// CHECK: Size: 1 // CHECK: Align: 1 // CHECK: ValueKind: ByValue // CHECK: ValueType: I8 // CHECK: AccQual: Default -// CHECK: TypeName: char // CHECK: - Size: 8 // CHECK: Align: 8 // CHECK: ValueKind: HiddenGlobalOffsetX @@ -41,15 +42,16 @@ Printf: [ '1:1:4:%d\n', '2:1:8:%g\n' ] Kernels: - Name: test_kernel + SymbolName: test_kernel@kd Language: OpenCL C LanguageVersion: [ 2, 0 ] Args: - - Size: 1 + - TypeName: char + Size: 1 Align: 1 ValueKind: ByValue ValueType: I8 AccQual: Default - TypeName: char - Size: 8 Align: 8 ValueKind: HiddenGlobalOffsetX diff --git a/test/MC/AMDGPU/hsa-metadata-kernel-attrs.s b/test/MC/AMDGPU/hsa-metadata-kernel-attrs.s index 525d25e521d..5a9fdd22069 100644 --- a/test/MC/AMDGPU/hsa-metadata-kernel-attrs.s +++ b/test/MC/AMDGPU/hsa-metadata-kernel-attrs.s @@ -9,6 +9,7 @@ // CHECK: - '2:1:8:%g\n' // CHECK: Kernels: // CHECK: - Name: test_kernel +// CHECK: SymbolName: 'test_kernel@kd' // CHECK: Language: OpenCL C // CHECK: LanguageVersion: [ 2, 0 ] // CHECK: Attrs: @@ -21,6 +22,7 @@ Printf: [ '1:1:4:%d\n', '2:1:8:%g\n' ] Kernels: - Name: test_kernel + SymbolName: test_kernel@kd Language: OpenCL C LanguageVersion: [ 2, 0 ] Attrs: diff --git a/test/MC/AMDGPU/hsa-metadata-kernel-code-props.s b/test/MC/AMDGPU/hsa-metadata-kernel-code-props.s index 062e671357a..e290235b16c 100644 --- a/test/MC/AMDGPU/hsa-metadata-kernel-code-props.s +++ b/test/MC/AMDGPU/hsa-metadata-kernel-code-props.s @@ -5,20 +5,24 @@ // CHECK: .amd_amdgpu_hsa_metadata // CHECK: Version: [ 1, 0 ] // CHECK: Kernels: -// CHECK: - Name: test_kernel +// CHECK: - Name: test_kernel +// CHECK: SymbolName: 'test_kernel@kd' // CHECK: CodeProps: -// CHECK: KernargSegmentSize: 24 -// CHECK: WorkitemPrivateSegmentSize: 16 -// CHECK: WavefrontNumSGPRs: 6 -// CHECK: WorkitemNumVGPRs: 12 +// CHECK: KernargSegmentSize: 24 +// CHECK: GroupSegmentFixedSize: 24 +// CHECK: PrivateSegmentFixedSize: 16 +// CHECK: KernargSegmentAlign: 16 +// CHECK: WavefrontSize: 64 .amd_amdgpu_hsa_metadata Version: [ 1, 0 ] Printf: [ '1:1:4:%d\n', '2:1:8:%g\n' ] Kernels: - Name: test_kernel + SymbolName: test_kernel@kd CodeProps: - KernargSegmentSize: 24 - WorkitemPrivateSegmentSize: 16 - WavefrontNumSGPRs: 6 - WorkitemNumVGPRs: 12 + KernargSegmentSize: 24 + GroupSegmentFixedSize: 24 + PrivateSegmentFixedSize: 16 + KernargSegmentAlign: 16 + WavefrontSize: 64 .end_amd_amdgpu_hsa_metadata diff --git a/test/MC/AMDGPU/hsa-metadata-kernel-debug-props.s b/test/MC/AMDGPU/hsa-metadata-kernel-debug-props.s index 950049d115e..7efb8207ae4 100644 --- a/test/MC/AMDGPU/hsa-metadata-kernel-debug-props.s +++ b/test/MC/AMDGPU/hsa-metadata-kernel-debug-props.s @@ -5,7 +5,8 @@ // CHECK: .amd_amdgpu_hsa_metadata // CHECK: Version: [ 1, 0 ] // CHECK: Kernels: -// CHECK: - Name: test_kernel +// CHECK: - Name: test_kernel +// CHECK: SymbolName: 'test_kernel@kd' // CHECK: DebugProps: // CHECK: DebuggerABIVersion: [ 1, 0 ] // CHECK: ReservedNumVGPRs: 4 @@ -17,6 +18,7 @@ Printf: [ '1:1:4:%d\n', '2:1:8:%g\n' ] Kernels: - Name: test_kernel + SymbolName: test_kernel@kd DebugProps: DebuggerABIVersion: [ 1, 0 ] ReservedNumVGPRs: 4 diff --git a/test/MC/AMDGPU/hsa-metadata-unknown-key.s b/test/MC/AMDGPU/hsa-metadata-unknown-key.s index 58d40209831..f532930c7c6 100644 --- a/test/MC/AMDGPU/hsa-metadata-unknown-key.s +++ b/test/MC/AMDGPU/hsa-metadata-unknown-key.s @@ -12,6 +12,7 @@ Printf: [ '1:1:4:%d\n', '2:1:8:%g\n' ] Kernels: - Name: test_kernel + SymbolName: test_kernel@kd Language: OpenCL C LanguageVersion: [ 2, 0 ] Args: diff --git a/test/MC/AMDGPU/hsa.s b/test/MC/AMDGPU/hsa.s index 710f115adb1..82136fbca8b 100644 --- a/test/MC/AMDGPU/hsa.s +++ b/test/MC/AMDGPU/hsa.s @@ -40,15 +40,19 @@ .amd_amdgpu_hsa_metadata Version: [ 3, 0 ] Kernels: - - Name: amd_kernel_code_t_test_all - - Name: amd_kernel_code_t_minimal + - Name: amd_kernel_code_t_test_all + SymbolName: amd_kernel_code_t_test_all@kd + - Name: amd_kernel_code_t_minimal + SymbolName: amd_kernel_code_t_minimal@kd .end_amd_amdgpu_hsa_metadata // ASM: .amd_amdgpu_hsa_metadata // ASM: Version: [ 3, 0 ] // ASM: Kernels: -// ASM: - Name: amd_kernel_code_t_test_all -// ASM: - Name: amd_kernel_code_t_minimal +// ASM: - Name: amd_kernel_code_t_test_all +// ASM: SymbolName: 'amd_kernel_code_t_test_all@kd' +// ASM: - Name: amd_kernel_code_t_minimal +// ASM: SymbolName: 'amd_kernel_code_t_minimal@kd' // ASM: .end_amd_amdgpu_hsa_metadata .amdgpu_hsa_kernel amd_kernel_code_t_test_all