From bd0444f3656b44ab37f2bc5a8bbb5c6654a4519d Mon Sep 17 00:00:00 2001 From: Qianfeng Zhang Date: Thu, 6 Nov 2025 08:20:11 +0000 Subject: [PATCH] [Performance] Change the tile settings for mi350/trload no_softmax pipeline to enable use of mfma-16x16x32 for Gemm-1 --- .../ck_tile/18_hstu_attention/hstu_attention_fwd_setting.hpp | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/example/ck_tile/18_hstu_attention/hstu_attention_fwd_setting.hpp b/example/ck_tile/18_hstu_attention/hstu_attention_fwd_setting.hpp index 096bb69a8c..43207799eb 100644 --- a/example/ck_tile/18_hstu_attention/hstu_attention_fwd_setting.hpp +++ b/example/ck_tile/18_hstu_attention/hstu_attention_fwd_setting.hpp @@ -206,7 +206,7 @@ struct HstuAttentionNoSoftmaxFwdBlockTile<64> template <> struct HstuAttentionNoSoftmaxFwdBlockTile<128> { - using type = ck_tile::sequence<128, 32, 128, 16, 128>; + using type = ck_tile::sequence<128, 32, 128, 32, 128>; using gemm0_warps = ck_tile::sequence<4, 1, 1>; using gemm1_warps = ck_tile::sequence<4, 1, 1>; }; @@ -289,7 +289,7 @@ struct HstuAttentionNoSoftmaxFwdTileSetting<128> typename HstuAttentionNoSoftmaxFwdBlockTile<128>::gemm0_warps, HstuAttentionFwdWarpTile2, typename HstuAttentionNoSoftmaxFwdBlockTile<128>::gemm1_warps, - HstuAttentionFwdWarpTile1>; + HstuAttentionFwdWarpTile2>; }; template <>