Change in GetKVBlockGemm to let gemm1 use WarpTile-16x16x16/32x32x8 on mi350

This commit is contained in:
Qianfeng Zhang
2025-12-05 02:04:27 +00:00
parent 98f9b4a47b
commit c32949b285

View File

@@ -525,15 +525,9 @@ struct BlockFmhaPipelineQRKSVSWholeKPrefetchDefaultPolicy
constexpr index_t WarpGemmK =
Problem::BlockFmhaShape::Gemm1WarpTile::at(number<2>{});
#ifdef __gfx950__
static_assert((WarpGemmM == 16 && WarpGemmK == 32) ||
(WarpGemmM == 32 && WarpGemmK == 16),
"Not supported WarpGemm sizes!");
#else
static_assert((WarpGemmM == 16 && (WarpGemmK == 16 || WarpGemmK == 32)) ||
(WarpGemmM == 32 && (WarpGemmK == 8 || WarpGemmK == 16)),
"Not supported WarpGemm sizes!");
#endif
if constexpr((WarpGemmM == 16 && WarpGemmK == 32) ||
(WarpGemmM == 32 && WarpGemmK == 16))