mirror of
https://github.com/ROCm/composable_kernel.git
synced 2026-04-20 06:49:15 +00:00
[rocm-libraries] ROCm/rocm-libraries#4407 (commit adde219)
[CK][CK TILE] Add has-hot-loop check for pipeline v1 ## Motivation Add a has-hot-loop check to pipeline v1 (v1 basic and v1 basic async). Enable more tests that are fixed by this change. ## Technical Details Previously, the hot loop was executed without a num-loop check. ## Test Plan test_grouped_convnd_fwd_tile ## Test Result Passed ## Submission Checklist - [x] Look over the contributing guidelines at https://github.com/ROCm/ROCm/blob/develop/CONTRIBUTING.md#pull-requests. AICK-651 AICK-663
This commit is contained in:
committed by
assistant-librarian[bot]
parent
e88f139c6c
commit
2dd2f114b3
@@ -85,6 +85,13 @@ __device__ inline auto amd_wave_read_first_lane(const Object& obj)
|
||||
return out;
|
||||
}
|
||||
|
||||
// Host overload of amd_wave_read_first_lane: takes a value and returns it unchanged.
// NOTE(review): presumably provided so that code compiled for the host can call
// amd_wave_read_first_lane the same way as the __device__ overload - confirm against callers.
|
||||
template <typename T>
|
||||
__host__ inline T amd_wave_read_first_lane(T v)
|
||||
{
|
||||
return v;
|
||||
}
|
||||
|
||||
// 128 bit SGPRs to supply buffer resource in buffer instructions
|
||||
// https://rocm-documentation.readthedocs.io/en/latest/GCN_ISA_Manuals/testdocbook.html#vector-memory-buffer-instructions
|
||||
struct __attribute__((packed)) buffer_resource
|
||||
|
||||
@@ -81,6 +81,13 @@ __device__ inline auto amd_wave_read_first_lane(const Object& obj)
|
||||
return out;
|
||||
}
|
||||
|
||||
// Host overload of amd_wave_read_first_lane: takes a value and returns it unchanged.
// NOTE(review): presumably provided so that code compiled for the host can call
// amd_wave_read_first_lane the same way as the __device__ overload - confirm against callers.
|
||||
template <typename T>
|
||||
__host__ inline T amd_wave_read_first_lane(T v)
|
||||
{
|
||||
return v;
|
||||
}
|
||||
|
||||
// 128 bit SGPRs to supply buffer resource in buffer instructions
|
||||
// https://rocm-documentation.readthedocs.io/en/latest/GCN_ISA_Manuals/testdocbook.html#vector-memory-buffer-instructions
|
||||
struct __attribute__((packed)) buffer_resource
|
||||
|
||||
Reference in New Issue
Block a user