mirror of
https://github.com/ROCm/composable_kernel.git
synced 2026-04-20 06:49:15 +00:00
[rocm-libraries] ROCm/rocm-libraries#4875 (commit e35e3f2)
[CK] Port non-grouped convolution instances to the grouped kernels (#4875) ## Motivation Port non-grouped convolution instances to the grouped kernels in order to deprecate the older non-grouped implementations. ## Technical Details Add the same instances as the non-grouped ones, but using the grouped kernels. ## Test Plan test_grouped_convnd_fwd ## Test Result pass ## Submission Checklist - [x] Look over the contributing guidelines at https://github.com/ROCm/ROCm/blob/develop/CONTRIBUTING.md#pull-requests. AICK-724
This commit is contained in:
committed by
assistant-librarian[bot]
parent
b661eab573
commit
ef82340e05
@@ -376,6 +376,10 @@ struct GridwiseGemmMultipleD_xdl_cshuffle
|
||||
|
||||
return false;
|
||||
}
|
||||
if constexpr(KPerBlock < 16)
|
||||
{
|
||||
return false;
|
||||
}
|
||||
#endif
|
||||
|
||||
if constexpr(Base::GetSharedMemoryNumberOfByte(get_device_arch()) >
|
||||
@@ -415,6 +419,16 @@ struct GridwiseGemmMultipleD_xdl_cshuffle
|
||||
static_assert(KPerBlock % AK1Value == 0 && KPerBlock % BK1Value == 0,
|
||||
"KPerBlock must be divisible by AK1Value and BK1Value!");
|
||||
|
||||
#ifndef __HIPCC_RTC__
|
||||
if constexpr(KPerBlock < 16)
|
||||
{
|
||||
if(ck::is_gfx12_supported() || ck::is_gfx11_supported())
|
||||
{
|
||||
return false;
|
||||
}
|
||||
}
|
||||
#endif
|
||||
|
||||
const auto M = a_grid_desc_m_k.GetLength(I0);
|
||||
const auto N = b_grid_desc_n_k.GetLength(I0);
|
||||
const auto AK = a_grid_desc_m_k.GetLength(I1);
|
||||
|
||||
Reference in New Issue
Block a user