mirror of
https://github.com/ROCm/composable_kernel.git
synced 2026-05-21 21:39:15 +00:00
Grouped Conv Bwd Weight Direct Load (#3648)
* Grouped Conv Bwd Weight Direct Load
* Update gridwise_gemm_xdl_cshuffle_conv_v3.hpp
* Implement group merging for bwd_weight and add instances
* Link direct load instances
* builder fixes
* fix
* fixes
* fix
---------
Co-authored-by: Graner, Johannes <johannes.graner@amd.com>
[ROCm/composable_kernel commit: 83b58bb0c3]
This commit is contained in:
@@ -32,7 +32,8 @@ constexpr auto ALGORITHM =
 .with_gemm_config(cku::BwdGemmParams_Xdl_1x1_per_wave)
 .with_transfer(cku::BwdTransfer_4x8x1_4x16x1_v3)
 .with_bwd_specialization(ckb::ConvSpecialization::FILTER_1X1_STRIDE1_PAD0)
-.with_block_gemm(cku::BlockGemmDesc_v2_intrawave);
+.with_block_gemm(cku::BlockGemmDesc_v2_intrawave)
+.with_num_conv_groups_to_merge(1);
 
 using Builder = ckb::ConvBuilder<SIGNATURE, ALGORITHM>;
 using Instance = Builder::Instance;
Reference in New Issue
Block a user