mirror of
https://github.com/ROCm/composable_kernel.git
synced 2026-07-01 12:17:00 +00:00
best perf pw gemm config 0.11ms
This commit is contained in:
4
example/ck_tile/03_gemm/gemm_utils.hpp
Normal file → Executable file
4
example/ck_tile/03_gemm/gemm_utils.hpp
Normal file → Executable file
@@ -280,8 +280,8 @@ struct GemmConfigPreshuffleDecode : public GemmConfigBase
 template <typename PrecType>
 struct GemmConfigPreshufflePrefill : public GemmConfigBase
 {
-    static constexpr ck_tile::index_t M_Tile = 128;
-    static constexpr ck_tile::index_t N_Tile = 128;
+    static constexpr ck_tile::index_t M_Tile = 64;
+    static constexpr ck_tile::index_t N_Tile = 256;
     static constexpr ck_tile::index_t K_Tile = 128 / sizeof(PrecType);
 
     static constexpr ck_tile::index_t M_Warp = 1;
2
example/ck_tile/03_gemm/gemm_weight_preshuffle.cpp
Normal file → Executable file
2
example/ck_tile/03_gemm/gemm_weight_preshuffle.cpp
Normal file → Executable file
@@ -277,7 +277,7 @@ int main(int argc, char* argv[])
 
     try
     {
-        return !run_gemm_example<GemmConfigPreshuffleDecode>(arg_parser);
+        return !run_gemm_example<GemmConfigPreshufflePrefill>(arg_parser);
     }
     catch(const std::runtime_error& e)
     {
Reference in New Issue
Block a user