Use kM0=128, kN0=64 to completely remove VGPR spilling

This commit is contained in:
Qianfeng Zhang
2025-04-15 15:08:46 +00:00
parent 3cd1b13e46
commit d1749b3aae

View File

@@ -35,7 +35,7 @@ struct HstuAttentionFwdBlockTile<64>
// Tile configuration selected when HstuAttentionFwdBlockTile is instantiated
// with 128 (NOTE(review): presumably the head dimension -- confirm against
// the primary template).
template <>
struct HstuAttentionFwdBlockTile<128>
{
    // Block tile shape. The accompanying commit message names the values
    // being set as kM0=128 and kN0=64, which correspond to the first two
    // entries here. kN0 was lowered from 128 to 64 (the alias was previously
    // ck_tile::sequence<128, 128, 32, 128, 32, 128>) to completely remove
    // VGPR spilling. Only this single declaration of `type` may exist:
    // declaring the alias twice with different types is ill-formed.
    using type = ck_tile::sequence<128, 64, 32, 128, 32, 128>;

    // Warp arrangement for each of the two GEMMs
    // (NOTE(review): presumably warps along M, N, K -- confirm).
    using gemm0_warps = ck_tile::sequence<4, 1, 1>;
    using gemm1_warps = ck_tile::sequence<4, 1, 1>;
};