// Mirror of https://github.com/ROCm/composable_kernel.git (synced 2026-06-30 11:47:48 +00:00)
// 36 lines, 1.7 KiB, C++
#include <iostream>
|
|
|
|
#include <hip/hip_runtime.h>
|
|
|
|
#include "convolution_builder.hpp"
|
|
|
|
// Example of problem description for Forward Conv with default settings
|
|
struct GroupedConvFwdXdlImplicitGemm : public GroupedConvBaseXdlV1 {
|
|
static constexpr ConvolutionDirection ConvolutionDirection_ = ConvolutionDirection::Forward;
|
|
static constexpr ElementwiseOperation ElementwiseOperation_ = ElementwiseOperation::Bias;
|
|
};
|
|
|
|
// Example of problem description for Backward Weight Conv with default settings and Split K Two Stage
|
|
struct GroupedConvBwdWeightXdlImplicitGemmTwoStage : public GroupedConvBaseXdlV1 {
|
|
static constexpr ConvolutionDirection ConvolutionDirection_ = ConvolutionDirection::BackwardWeight;
|
|
static constexpr SplitKSupport SplitKSupport_ = SplitKSupport::SupportedTwoStage;
|
|
};
|
|
|
|
struct ImplementationDescriptor : public NHWCImplementationBaseV1, public BF16ImplementationBaseV1 {
|
|
static constexpr ck::index_t BlockSize_ = 64;
|
|
static constexpr auto TileSizes_ = std::make_tuple(16, 16, 32);
|
|
static constexpr ck::index_t K1_ = 8;
|
|
static constexpr MFMAInstructionSize MFMAInstructionSize_ = MFMAInstructionSize::M16N16;
|
|
static constexpr auto XdlPerWave_ = std::make_tuple(16, 16);
|
|
static constexpr auto GlobalTransferVectorSize_ = std::make_tuple(1, 1, 1);
|
|
static constexpr auto LDSStoreVectorSize_ = std::make_tuple(4, 4);
|
|
};
|
|
|
|
int main () {
|
|
ConvolutionBuilder<GroupedConvFwdXdlImplicitGemm, ImplementationDescriptor> builder_fwd;
|
|
std::cout << builder_fwd.GetInstanceName() << std::endl;
|
|
ConvolutionBuilder<GroupedConvBwdWeightXdlImplicitGemmTwoStage, ImplementationDescriptor> builder_bwd_weight_two_stage;
|
|
std::cout << builder_bwd_weight_two_stage.GetInstanceName() << std::endl;
|
|
return 0;
|
|
}
|