Change the tile setting to use mfma-32x32x16 for the WithSoftmax pipeline on gfx950

This commit is contained in:
Qianfeng Zhang
2026-02-05 15:57:18 +00:00
parent 8af5e26717
commit d169ed2194

View File

@@ -260,7 +260,7 @@ struct HstuAttentionWithSoftmaxFwdBlockTile<96>
// Explicit specialization of HstuAttentionWithSoftmaxFwdBlockTile for the template argument 128.
// It exposes three type aliases: `type`, `gemm0_warps` and `gemm1_warps`.
// NOTE(review): this text is a rendered diff hunk with its +/- markers stripped. The two
// consecutive `using type` lines are presumably the removed line followed by its replacement,
// not two declarations meant to coexist -- confirm against the actual header.
template <>
struct HstuAttentionWithSoftmaxFwdBlockTile<128>
{
// Presumably the pre-change value: third element is 16, fifth element is 32.
using type = ck_tile::sequence<128, 64, 16, 128, 32, 128>;
// Presumably the post-change value: the third and fifth elements become 32 and 16.
using type = ck_tile::sequence<128, 64, 32, 128, 16, 128>;
// Both warp sequences are <4, 1, 1>.
// NOTE(review): the names suggest one per GEMM stage; element meaning is not visible here.
using gemm0_warps = ck_tile::sequence<4, 1, 1>;
using gemm1_warps = ck_tile::sequence<4, 1, 1>;
};
@@ -373,9 +373,9 @@ struct HstuAttentionWithSoftmaxFwdTileSetting<128>
// Alias `Type`: instantiates ck_tile::HstuAttentionFwdTileSettingClass with the `type`,
// `gemm0_warps` and `gemm1_warps` aliases of HstuAttentionWithSoftmaxFwdBlockTile<128>,
// each warps alias being followed by a warp-tile type.
// NOTE(review): rendered diff hunk without +/- markers. Each WarpTile_16x16x32 line is
// presumably the removed line and the WarpTile_32x32x16 line after it its replacement, so the
// resulting alias would take five template arguments, not seven -- confirm against the real header.
using Type = ck_tile::HstuAttentionFwdTileSettingClass<
typename HstuAttentionWithSoftmaxFwdBlockTile<128>::type,
typename HstuAttentionWithSoftmaxFwdBlockTile<128>::gemm0_warps,
WarpTile_16x16x32,
WarpTile_32x32x16,
typename HstuAttentionWithSoftmaxFwdBlockTile<128>::gemm1_warps,
WarpTile_16x16x32>;
WarpTile_32x32x16>;
};
template <>