diff --git a/example/20_grouped_conv_bwd_weight/grouped_conv_bwd_weight_v3_wmma_bf16.cpp b/example/20_grouped_conv_bwd_weight/grouped_conv_bwd_weight_v3_wmma_bf16.cpp index 2b6f145baa..6e6b877b16 100644 --- a/example/20_grouped_conv_bwd_weight/grouped_conv_bwd_weight_v3_wmma_bf16.cpp +++ b/example/20_grouped_conv_bwd_weight/grouped_conv_bwd_weight_v3_wmma_bf16.cpp @@ -17,7 +17,6 @@ using OutElementOp = PassThrough; template using DeviceConvBwdWeightInstance = - // clang-format on ck::tensor_operation::device::DeviceGroupedConvBwdWeight_Wmma_CShuffleV3< NDimSpatial, ck::tuple_element_t, // CShuffleBlockTransferClusterLengths_MBlock_MPerBlock_NBlock_NPerBlock - 128 / (sizeof(WeiDataType) * CHAR_BIT)>; // CBlockTransferScalarPerVector_NWaveNPerXdl - // clang-format off + 2>; // CShuffleBlockTransferScalarPerVector_NPerBlock template using HostConvBwdWeightInstance = ck::tensor_operation::host::ReferenceConvBwdWeight