Add a granularity check for atomic add (#2959)

[ROCm/composable_kernel commit: cadafde722]
This commit is contained in:
Thomas Ning
2025-10-02 11:15:24 -07:00
committed by GitHub
parent 1aa5b318cb
commit 0959c6582a
2 changed files with 8 additions and 4 deletions

View File

@@ -682,6 +682,10 @@ struct DeviceGemmMultiD_Xdl_CShuffle_V3 : public DeviceGemmMultipleDSplitK<ALayo
return GridwiseGemm64::CheckValidity(arg);
}
}
if(CDEShuffleBlockTransferScalarPerVectors{}[Number<0>{}] <= 1 && (arg.KBatch > 1))
{
return false;
}
else
{
if constexpr(NXdlPerWave32 > 0)