[CK] Fix example_grouped_conv_bwd_data_xdl_fp16 with ksplit = 2 (#2943)

Root cause: AK1 and BK1 may differ in the class template, so we need to calculate k0 per block separately when ksplit is not 1.
This commit is contained in:
linqunAMD
2025-09-29 22:56:33 +08:00
committed by GitHub
parent 5477811670
commit 769c58f133
2 changed files with 13 additions and 9 deletions

View File

@@ -1671,7 +1671,10 @@ struct DeviceGroupedConvBwdDataMultipleD_Xdl_CShuffle_v1
valid = false;
}
}
else
}
else
{
if constexpr(NXdlPerWave32 > 0)
{
if(!GridwiseGemmCTranspose32::CheckValidity(
arg.a_grid_desc_m_k_container_[i],
@@ -1686,10 +1689,10 @@ struct DeviceGroupedConvBwdDataMultipleD_Xdl_CShuffle_v1
valid = false;
}
}
if(!valid)
{
return false;
}
}
if(!valid)
{
return false;
}
}