[rocm-libraries] ROCm/rocm-libraries#4875 (commit e35e3f2)

[CK] Port non-grouped convolution instances to the grouped
 kernels (#4875)

## Motivation

Port non-grouped convolution instances to the grouped kernels in order to
deprecate the older non-grouped implementations.

## Technical Details

Add the same instances as the non-grouped ones, but using the grouped kernel.

## Test Plan

test_grouped_convnd_fwd

## Test Result

pass

## Submission Checklist

- [x] Look over the contributing guidelines at
https://github.com/ROCm/ROCm/blob/develop/CONTRIBUTING.md#pull-requests.

AICK-724
This commit is contained in:
Bartłomiej Kocot
2026-02-28 01:25:33 +00:00
committed by assistant-librarian[bot]
parent b661eab573
commit ef82340e05
6 changed files with 219 additions and 0 deletions

View File

@@ -376,6 +376,10 @@ struct GridwiseGemmMultipleD_xdl_cshuffle
return false;
}
if constexpr(KPerBlock < 16)
{
return false;
}
#endif
if constexpr(Base::GetSharedMemoryNumberOfByte(get_device_arch()) >
@@ -415,6 +419,16 @@ struct GridwiseGemmMultipleD_xdl_cshuffle
static_assert(KPerBlock % AK1Value == 0 && KPerBlock % BK1Value == 0,
"KPerBlock must be divisible by AK1Value and BK1Value!");
#ifndef __HIPCC_RTC__
if constexpr(KPerBlock < 16)
{
if(ck::is_gfx12_supported() || ck::is_gfx11_supported())
{
return false;
}
}
#endif
const auto M = a_grid_desc_m_k.GetLength(I0);
const auto N = b_grid_desc_n_k.GetLength(I0);
const auto AK = a_grid_desc_m_k.GetLength(I1);