mirror of
https://github.com/ROCm/composable_kernel.git
synced 2026-07-01 20:27:42 +00:00
Remove oversubscription.
This commit is contained in:
@@ -528,9 +528,7 @@ struct DeviceGroupedConvBwdWeight_Xdl_CShuffleV3
|
||||
get_bwd_weight_gemm_sizes<NDimSpatial>(a_g_n_k_wos_lengths, e_g_k_c_xs_lengths);
|
||||
const auto k_grid_size = k_dim_size_ / K0PerBlock;
|
||||
|
||||
-// For V3 pipeline, it is beneficial to oversubscribe and consider the total grid size to be only
|
||||
-// the grid of the GEMM output tiles.
|
||||
-const auto total_grid_size = grid_size_mn;
|
||||
+const auto total_grid_size = grid_size_mn * Conv_G_;
|
||||
k_batch_ = split_k_parameters.strategy_== SplitKStrategy::BestOccupancy
|
||||
? get_best_occupancy_k_batch_value(max_occupancy.value_, total_grid_size)
|
||||
: get_optimized_k_batch_value(max_occupancy.value_, grid_size_mn, k_grid_size);
|
||||
|
||||
Reference in New Issue
Block a user