Add a granularity check for atomic add (#2959)

This commit is contained in:
Thomas Ning
2025-10-02 11:15:24 -07:00
committed by GitHub
parent 6fc28ab493
commit cadafde722
2 changed files with 8 additions and 4 deletions

View File

@@ -682,6 +682,10 @@ struct DeviceGemmMultiD_Xdl_CShuffle_V3 : public DeviceGemmMultipleDSplitK<ALayo
return GridwiseGemm64::CheckValidity(arg);
}
}
if(CDEShuffleBlockTransferScalarPerVectors{}[Number<0>{}] <= 1 && (arg.KBatch > 1))
{
return false;
}
else
{
if constexpr(NXdlPerWave32 > 0)