This commit is contained in:
AMD-dteng
2025-03-24 22:55:46 +08:00
parent 3e2ee2f3a4
commit 921c9dfc9a
2 changed files with 4 additions and 2 deletions

View File

@@ -27,8 +27,8 @@ float flatmm_calc(const ck_tile::FlatmmHostArgs& args, const ck_tile::stream_con
constexpr ck_tile::index_t N_Tile = 128;
constexpr ck_tile::index_t K_Tile = 64;
-constexpr ck_tile::index_t M_Warp = 1;
-constexpr ck_tile::index_t N_Warp = 4;
+constexpr ck_tile::index_t M_Warp = 2;
+constexpr ck_tile::index_t N_Warp = 2;
constexpr ck_tile::index_t K_Warp = 1;
constexpr ck_tile::index_t M_Warp_Tile = 32;

View File

@@ -246,6 +246,8 @@ struct FlatmmPipelineAGmemBGmemCRegV1
});
});
block_sync_lds();
// GEMM i
block_flatmm(c_block_tile, a_lds_gemm_window, b_warp_tensor_2);