Merge commit '28ad8ae5d8558e147f29aba29db569fe25210947' into develop

This commit is contained in:
assistant-librarian[bot]
2025-09-29 23:11:42 +00:00
parent 78f2779870
commit 631a25de61
2 changed files with 6 additions and 2 deletions

View File

@@ -231,7 +231,7 @@ struct SplitKTwoStageInvoker
preprocess = clear_gemm_output;
}
- return ck_tile::launch_kernel_time_mask(
+ ave_time = ck_tile::launch_kernel_time_mask(
s,
preprocess,
ck_tile::make_kernel<GemmConfig::kBlockPerCu>(
@@ -245,6 +245,8 @@ struct SplitKTwoStageInvoker
ck_tile::make_tuple(args.N, 1), // Output Stride
input_tensors,
static_cast<CDataType*>(c_ptr)));
+ return ave_time;
};
const auto RunSplitk = [&](const auto has_hot_loop_, const auto tail_number_) {

View File

@@ -174,10 +174,12 @@ struct UniversalInvoker
preprocess = clear_gemm_output;
}
- return ck_tile::launch_kernel_time_mask(
+ ave_time = ck_tile::launch_kernel_time_mask(
s,
preprocess,
ck_tile::make_kernel<GemmConfig::kBlockPerCu>(Kernel{}, grids, blocks, 0, kargs));
+ return ave_time;
};
const auto RunSplitk = [&](const auto has_hot_loop_, const auto tail_number_) {