mirror of
https://github.com/ROCm/composable_kernel.git
synced 2026-05-15 18:42:06 +00:00
Use kM0=128, kN0=64 to completely eliminate VGPR spilling
This commit is contained in:
@@ -35,7 +35,7 @@ struct HstuAttentionFwdBlockTile<64>
|
||||
template <>
|
||||
struct HstuAttentionFwdBlockTile<128>
|
||||
{
|
||||
-using type = ck_tile::sequence<128, 128, 32, 128, 32, 128>;
|
||||
+using type = ck_tile::sequence<128, 64, 32, 128, 32, 128>;
|
||||
using gemm0_warps = ck_tile::sequence<4, 1, 1>;
|
||||
using gemm1_warps = ck_tile::sequence<4, 1, 1>;
|
||||
};
|
||||
|
||||
Reference in New Issue
Block a user