mirror of
https://github.com/ROCm/composable_kernel.git
synced 2026-04-19 22:39:03 +00:00
add the check of granularity for atomic add (#2959)
This commit is contained in:
@@ -682,6 +682,10 @@ struct DeviceGemmMultiD_Xdl_CShuffle_V3 : public DeviceGemmMultipleDSplitK<ALayo
|
||||
return GridwiseGemm64::CheckValidity(arg);
|
||||
}
|
||||
}
|
||||
if(CDEShuffleBlockTransferScalarPerVectors{}[Number<0>{}] <= 1 && (arg.KBatch > 1))
|
||||
{
|
||||
return false;
|
||||
}
|
||||
else
|
||||
{
|
||||
if constexpr(NXdlPerWave32 > 0)
|
||||
|
||||
@@ -11,7 +11,7 @@ TYPED_TEST(TEST_SUITE_NAME, SmallM)
|
||||
std::vector<int> Ms{1, 2, 3, 4, 5, 6};
|
||||
constexpr int N = 1024;
|
||||
std::vector<int> Ks;
|
||||
for (auto K_count: {2, 3, 4, 10, 11})
|
||||
for(auto K_count : {2, 3, 4, 10, 11})
|
||||
{
|
||||
Ks.push_back(K_count * TestFixture::K_Tile);
|
||||
}
|
||||
@@ -36,10 +36,10 @@ TYPED_TEST(TEST_SUITE_NAME, SmallM)
|
||||
TYPED_TEST(TEST_SUITE_NAME, MidLargeM)
|
||||
{
|
||||
std::vector<int> Ms{127, 255, 312, 799, 1573};
|
||||
constexpr int N = 1024;
|
||||
constexpr int N = 1024;
|
||||
|
||||
std::vector<int> Ks;
|
||||
for (auto K_count: {2, 3, 4, 10, 11})
|
||||
for(auto K_count : {2, 3, 4, 10, 11})
|
||||
{
|
||||
Ks.push_back(K_count * TestFixture::K_Tile);
|
||||
}
|
||||
@@ -51,7 +51,7 @@ TYPED_TEST(TEST_SUITE_NAME, MidLargeM)
|
||||
|
||||
for(int M : Ms)
|
||||
{
|
||||
for (int K: Ks)
|
||||
for(int K : Ks)
|
||||
{
|
||||
if constexpr(std::is_same_v<typename TestFixture::ALayout,
|
||||
ck_tile::tensor_layout::gemm::ColumnMajor>)
|
||||
|
||||
Reference in New Issue
Block a user