Files
composable_kernel/include/ck/host_utility/device_prop.hpp
Illia Silin 717f2efef7 [rocm-libraries] ROCm/rocm-libraries#6978 (commit e58096d)
[CK] add composable kernel support on gfx1250 (#6978)

## Motivation

Add composable kernel support on gfx1250.

## Technical Details

<!-- Explain the changes along with any relevant GitHub links. -->

## Test Plan

<!-- Explain any relevant testing done to verify this PR. -->

## Test Result

<!-- Briefly summarize test outcomes. -->

## Submission Checklist

- [ ] Look over the contributing guidelines at
https://github.com/ROCm/ROCm/blob/develop/CONTRIBUTING.md#pull-requests.

---------

Co-authored-by: Qun Lin <qlin@amd.com>
Co-authored-by: jialuo12_amdeng <jia.luo@amd.com>
Co-authored-by: Andriy Roshchenko <andriy.roshchenko@amd.com>
Co-authored-by: hsivasun_amdeng <haresh.sivasuntharampillai@amd.com>
2026-05-15 06:46:51 -07:00

256 lines
6.8 KiB
C++

// Copyright (c) Advanced Micro Devices, Inc., or its affiliates.
// SPDX-License-Identifier: MIT
#pragma once
#ifndef __HIPCC_RTC__
#include <string>
#include <string_view>
#include <hip/hip_runtime.h>
namespace ck {
constexpr unsigned int fnv1a_hash(std::string_view str, unsigned int h = 2166136261u)
{
return str.empty() ? h
: fnv1a_hash(str.substr(1),
(h ^ static_cast<unsigned char>(str.front())) * 16777619u);
}
inline std::string get_device_name()
{
hipDeviceProp_t props{};
int device;
auto status = hipGetDevice(&device);
if(status != hipSuccess)
{
return std::string();
}
status = hipGetDeviceProperties(&props, device);
if(status != hipSuccess)
{
return std::string();
}
const std::string raw_name(props.gcnArchName);
const auto name = raw_name.substr(0, raw_name.find(':')); // str.substr(0, npos) returns str.
switch(fnv1a_hash(name))
{
// https://github.com/ROCm/MIOpen/blob/8498875aef84878e04c1eabefdf6571514891086/src/target_properties.cpp#L40
case fnv1a_hash("Ellesmere"):
case fnv1a_hash("Baffin"):
case fnv1a_hash("RacerX"):
case fnv1a_hash("Polaris10"):
case fnv1a_hash("Polaris11"):
case fnv1a_hash("Tonga"):
case fnv1a_hash("Fiji"):
case fnv1a_hash("gfx800"):
case fnv1a_hash("gfx802"):
case fnv1a_hash("gfx804"): return "gfx803";
case fnv1a_hash("Vega10"):
case fnv1a_hash("gfx901"): return "gfx900";
case fnv1a_hash("10.3.0 Sienna_Cichlid 18"): return "gfx1030";
default: return name;
}
}
inline bool is_gfx90a() { return ck::get_device_name() == "gfx90a"; }
inline int get_device_revision()
{
hipDeviceProp_t props{};
int device;
auto status = hipGetDevice(&device);
if(status != hipSuccess)
{
return -1; // Error: cannot get device
}
status = hipGetDeviceProperties(&props, device);
if(status != hipSuccess)
{
return -1; // Error: cannot get device properties
}
return props.asicRevision;
}
inline bool is_gfx12_supported()
{
return ck::get_device_name() == "gfx1200" || ck::get_device_name() == "gfx1201" ||
ck::get_device_name() == "gfx1250";
}
inline bool is_gfx11_supported()
{
return ck::get_device_name() == "gfx1100" || ck::get_device_name() == "gfx1101" ||
ck::get_device_name() == "gfx1102" || ck::get_device_name() == "gfx1103" ||
ck::get_device_name() == "gfx1150" || ck::get_device_name() == "gfx1151" ||
ck::get_device_name() == "gfx1152" || ck::get_device_name() == "gfx1153";
}
inline bool is_gfx101_supported()
{
return ck::get_device_name() == "gfx1010" || ck::get_device_name() == "gfx1011" ||
ck::get_device_name() == "gfx1012";
}
inline bool is_gfx103_supported()
{
return ck::get_device_name() == "gfx1030" || ck::get_device_name() == "gfx1031" ||
ck::get_device_name() == "gfx1032" || ck::get_device_name() == "gfx1033" ||
ck::get_device_name() == "gfx1034" || ck::get_device_name() == "gfx1035" ||
ck::get_device_name() == "gfx1036";
}
inline bool is_gfx120_supported()
{
return ck::get_device_name() == "gfx1200" || ck::get_device_name() == "gfx1201";
}
inline bool is_gfx125_supported() { return ck::get_device_name() == "gfx1250"; }
inline bool is_xdl_supported()
{
return ck::get_device_name() == "gfx908" || ck::get_device_name() == "gfx90a" ||
ck::get_device_name() == "gfx942" || ck::get_device_name() == "gfx950" ||
is_gfx12_supported() || is_gfx11_supported();
}
template <typename ADataType,
typename BDataType,
index_t MPerXDL64,
index_t NPerXDL64,
index_t MPerXDL32 = MPerXDL64,
index_t NPerXDL32 = NPerXDL64>
inline bool is_xdl_wmma_supported()
{
if(ck::get_device_name() == "gfx908" || ck::get_device_name() == "gfx90a" ||
ck::get_device_name() == "gfx942" || ck::get_device_name() == "gfx950")
{
return true;
}
else if(is_gfx120_supported() || is_gfx11_supported())
{
if constexpr((MPerXDL32 != 16) || (NPerXDL32 != 16))
{
return false;
}
if constexpr(sizeof(ADataType) > 2 || sizeof(BDataType) > 2)
{
return false;
}
return true;
}
else if(is_gfx125_supported())
{
if constexpr((MPerXDL32 != 16) || (NPerXDL32 != 16))
{
return false;
}
if constexpr(sizeof(ADataType) > 4 || sizeof(BDataType) > 4)
{
if(ck::get_device_name() == "gfx1250")
{
return false;
}
}
return true;
}
else
{
return false;
}
}
template <typename ADataType, index_t KPerBlock, index_t KPack = 256>
inline bool is_xdl_wmma_k_supported()
{
if(is_gfx125_supported())
{
if constexpr(sizeof(ADataType) == 1)
{
return (KPerBlock % 64 == 0) && (KPack % 32 == 0);
}
else if constexpr(sizeof(ADataType) == 2)
{
return (KPerBlock % 32 == 0) && (KPack % 16 == 0);
}
return true;
}
else if(is_gfx120_supported())
{
return (KPerBlock % 16 == 0) && (KPack % 8 == 0);
}
else if(is_gfx11_supported())
{
return (KPerBlock % 16 == 0) && (KPack % 16 == 0);
}
return true;
}
template <typename ADataType, index_t K1 = 0>
inline index_t __host__ get_wmma_k()
{
if(is_gfx125_supported())
{
return 64 / sizeof(ADataType);
}
else
{
return K1 == 16 ? 32 : 16;
}
}
template <typename ADataType, index_t K1 = 0>
inline index_t __device__ get_wmma_k()
{
#if defined(__gfx125__)
return 64 / sizeof(ADataType);
#else
return K1 == 16 ? 32 : 16;
#endif
}
inline bool is_lds_direct_load_supported()
{
// Check if direct loads from global memory to LDS are supported.
return ck::get_device_name() == "gfx90a" || ck::get_device_name() == "gfx942" ||
ck::get_device_name() == "gfx950" || is_gfx125_supported();
}
inline bool is_bf16_atomic_supported()
{
return ck::get_device_name() == "gfx942" || ck::get_device_name() == "gfx950" ||
is_gfx12_supported();
}
inline bool is_wmma_supported()
{
return is_gfx103_supported() || is_gfx11_supported() || is_gfx12_supported();
}
inline bool is_tf32_supported()
{
return ck::get_device_name() == "gfx942" || ck::get_device_name() == "gfx950";
}
inline int __host__ get_lds_size()
{
int device = 0;
int result = 0;
auto status = hipGetDevice(&device);
if(status == hipSuccess)
{
status = hipDeviceGetAttribute(&result, hipDeviceAttributeMaxSharedMemoryPerBlock, device);
if(status == hipSuccess)
{
return result;
}
}
return 64 * 1024;
}
} // namespace ck
#endif