Use MFMA 16x16x32 warp tile (M/N/K_Warp_Tile: 32x32x16 -> 16x16x32)

This commit is contained in:
mhYang
2025-03-31 23:18:22 +00:00
parent ee28e965f2
commit d1dbc69eda

View File

@@ -71,9 +71,9 @@ struct GridGemm
static constexpr index_t M_Warp = 2;
static constexpr index_t N_Warp = 2;
static constexpr index_t K_Warp = 1;
- static constexpr index_t M_Warp_Tile = 32;
- static constexpr index_t N_Warp_Tile = 32;
- static constexpr index_t K_Warp_Tile = 16;
+ static constexpr index_t M_Warp_Tile = 16;
+ static constexpr index_t N_Warp_Tile = 16;
+ static constexpr index_t K_Warp_Tile = 32;
static constexpr bool DoubleSmemBuffer = false;
static constexpr bool kPadM = false;
static constexpr bool kPadN = false;