mirror of
https://github.com/ROCm/composable_kernel.git
synced 2026-06-29 11:16:59 +00:00
add limiting for N0/NWave
This commit is contained in:
@@ -923,20 +923,14 @@ struct GridwiseGemmMultiD_xdl_cshuffle_v3_b_preshuffle
|
||||
static_assert((MPerBlock % (MPerXdl * MXdlPerWave) == 0) &&
|
||||
(NPerBlock % (NXdlPerWave * NPerXdl)) == 0,
|
||||
"Invalid tuning param!");
|
||||
// should remove KPadding
|
||||
if((GemmSpec == tensor_operation::device::GemmSpecialization::KPadding) &&
|
||||
((karg.BK0Shuffled % karg.KBatch) != 0))
|
||||
{
|
||||
return false;
|
||||
}
|
||||
|
||||
// no K-padding operator is added, so the shuffle-padded K must be a multiple of KPerBlock
|
||||
if(CalculateBKShufflePadded(karg.K) % KPerBlock != 0)
|
||||
if((CalculateBKShufflePadded(karg.K) % KPerBlock != 0) ||
|
||||
(karg.BK0Shuffled % karg.KBatch != 0))
|
||||
{
|
||||
return false;
|
||||
}
|
||||
|
||||
if(karg.N % NPerXdl != 0)
|
||||
if((karg.N % NPerXdl != 0) || (karg.BN0Shuffled % NWave != 0))
|
||||
{
|
||||
return false;
|
||||
}
|
||||
|
||||
Reference in New Issue
Block a user