Merge commit '8681ced9629f6e952afa5b77c5f3549d60920efa' into develop

This commit is contained in:
assistant-librarian[bot]
2025-11-04 14:12:38 +00:00
parent 58d420c0a4
commit 5b7defb9da
14 changed files with 230 additions and 219 deletions

View File

@@ -19,7 +19,7 @@
namespace ck_tile {
/// @brief The Grouped Convolution kernel device arguments.
template <typename GroupedConvTraitsType_>
template <typename GroupedConvTraitsType_, typename CDElementwise_>
struct GroupedConvFwdKernelArgs
{
@@ -31,7 +31,7 @@ struct GroupedConvFwdKernelArgs
GroupedConvTraitsType_::VectorSizeC,
GroupedConvTraitsType_::NumGroupsToMerge,
true>; // Split N enabled
using CDElementwise = typename GroupedConvTraitsType_::CDElementwise;
using CDElementwise = CDElementwise_;
static constexpr index_t NumDTensor = GroupedConvTraitsType_::NumDTensor;
template <
@@ -469,7 +469,8 @@ struct GroupedConvolutionForwardKernel
using CDElementwise = typename EpiloguePipeline::CDElementwise;
using GroupedConvFwdKernelArgsSpecialized = GroupedConvFwdKernelArgs<GroupedConvTraitsType_>;
using GroupedConvFwdKernelArgsSpecialized =
GroupedConvFwdKernelArgs<GroupedConvTraitsType_, CDElementwise>;
static constexpr bool IsSplitKSupported = false;