mirror of
https://github.com/ROCm/composable_kernel.git
synced 2026-05-17 03:19:48 +00:00
Refactor device op implementations into impl subdirectory. (#420)
* Move kernel implementation files under impl directory.
* Update examples paths.
* Update device kernel impl include paths.
* Update tensor operation instances include paths.
* Update profiler and tests include paths.
* Clang-format
* Update include paths for batched gemm reduce
* Refactor UnitTest ConvNDBwdWeight.
* Refactor fwd and bwd data convND UT.
* Fix used test macro.
* Fix include path.
* Fix include paths.
* Fix include paths in profiler and tests.
* Fix include paths.
Co-authored-by: Adam Osewski <aosewski@amd.com>
[ROCm/composable_kernel commit: 3048028897]
This commit is contained in:
@@ -5,7 +5,7 @@
|
||||
|
||||
#include <vector>
|
||||
#include "ck/tensor_operation/gpu/device/gemm_specialization.hpp"
|
||||
#include "ck/tensor_operation/gpu/device/device_batched_gemm_gemm_xdl_cshuffle.hpp"
|
||||
#include "ck/tensor_operation/gpu/device/impl/device_batched_gemm_gemm_xdl_cshuffle.hpp"
|
||||
#include "profiler/include/profile_batched_gemm_gemm_impl.hpp"
|
||||
|
||||
using ck::tensor_operation::device::GemmSpecialization;
|
||||
|
||||
@@ -5,7 +5,7 @@
|
||||
|
||||
#include <vector>
|
||||
#include "ck/tensor_operation/gpu/device/gemm_specialization.hpp"
|
||||
#include "ck/tensor_operation/gpu/device/device_batched_gemm_softmax_gemm_permute_xdl_cshuffle.hpp"
|
||||
#include "ck/tensor_operation/gpu/device/impl/device_batched_gemm_softmax_gemm_permute_xdl_cshuffle.hpp"
|
||||
#include "profiler/include/profile_batched_gemm_masking_scale_softmax_gemm_permute_impl.hpp"
|
||||
using ck::tensor_operation::device::GemmSpecialization;
|
||||
|
||||
|
||||
@@ -5,7 +5,7 @@
|
||||
|
||||
#include <vector>
|
||||
#include "ck/tensor_operation/gpu/device/gemm_specialization.hpp"
|
||||
#include "ck/tensor_operation/gpu/device/device_batched_gemm_softmax_gemm_xdl_cshuffle.hpp"
|
||||
#include "ck/tensor_operation/gpu/device/impl/device_batched_gemm_softmax_gemm_xdl_cshuffle.hpp"
|
||||
#include "profiler/include/profile_batched_gemm_softmax_gemm_impl.hpp"
|
||||
using ck::tensor_operation::device::GemmSpecialization;
|
||||
|
||||
|
||||
@@ -5,237 +5,89 @@
|
||||
#include <iostream>
|
||||
#include <initializer_list>
|
||||
#include <vector>
|
||||
#include <tuple>
|
||||
#include <gtest/gtest.h>
|
||||
|
||||
#include "profiler/include/profile_conv_bwd_data_impl.hpp"
|
||||
|
||||
template <typename Tuple>
|
||||
class TestConvndBwdData : public ::testing::Test
|
||||
{
|
||||
protected:
|
||||
using DataType = std::tuple_element_t<0, Tuple>;
|
||||
std::vector<ck::utils::conv::ConvParam> conv_params;
|
||||
|
||||
template <ck::index_t NDimSpatial>
|
||||
void Run()
|
||||
{
|
||||
for(auto& param : conv_params)
|
||||
{
|
||||
bool pass;
|
||||
EXPECT_FALSE(conv_params.empty());
|
||||
pass = ck::profiler::profile_conv_bwd_data_impl<
|
||||
NDimSpatial,
|
||||
ck::tuple_element_t<NDimSpatial - 1,
|
||||
ck::Tuple<ck::tensor_layout::convolution::NWC,
|
||||
ck::tensor_layout::convolution::NHWC,
|
||||
ck::tensor_layout::convolution::NDHWC>>,
|
||||
ck::tuple_element_t<NDimSpatial - 1,
|
||||
ck::Tuple<ck::tensor_layout::convolution::KXC,
|
||||
ck::tensor_layout::convolution::KYXC,
|
||||
ck::tensor_layout::convolution::KZYXC>>,
|
||||
ck::tuple_element_t<NDimSpatial - 1,
|
||||
ck::Tuple<ck::tensor_layout::convolution::NWK,
|
||||
ck::tensor_layout::convolution::NHWK,
|
||||
ck::tensor_layout::convolution::NDHWK>>,
|
||||
DataType,
|
||||
DataType,
|
||||
DataType>(true, // do_verification
|
||||
1, // init_method integer value
|
||||
false, // do_log
|
||||
false, // time_kernel
|
||||
param);
|
||||
EXPECT_TRUE(pass);
|
||||
}
|
||||
}
|
||||
};
|
||||
|
||||
using KernelTypes = ::testing::Types<std::tuple<float>,
|
||||
std::tuple<ck::half_t>,
|
||||
std::tuple<ck::bhalf_t>,
|
||||
std::tuple<std::int8_t>>;
|
||||
TYPED_TEST_SUITE(TestConvndBwdData, KernelTypes);
|
||||
|
||||
// 1d
|
||||
TEST_F(TestConvndBwdData, Conv1dBwdData)
|
||||
TYPED_TEST(TestConvndBwdData, Conv1dBwdData)
|
||||
{
|
||||
conv_params.clear();
|
||||
conv_params.push_back({1, 1, 128, 128, 256, {1}, {14}, {2}, {1}, {0}, {0}});
|
||||
conv_params.push_back({1, 1, 128, 128, 256, {3}, {28}, {1}, {1}, {1}, {1}});
|
||||
conv_params.push_back({1, 1, 128, 128, 256, {1}, {3}, {1}, {1}, {0}, {0}});
|
||||
|
||||
for(auto& param : conv_params)
|
||||
{
|
||||
bool pass;
|
||||
|
||||
// fp32
|
||||
pass = ck::profiler::profile_conv_bwd_data_impl<1,
|
||||
ck::tensor_layout::convolution::NWC,
|
||||
ck::tensor_layout::convolution::KXC,
|
||||
ck::tensor_layout::convolution::NWK,
|
||||
float,
|
||||
float,
|
||||
float>(true, // do_verification
|
||||
1, // init_method
|
||||
false, // do_log
|
||||
false, // time_kernel
|
||||
param);
|
||||
|
||||
EXPECT_TRUE(pass);
|
||||
|
||||
// fp16
|
||||
pass = ck::profiler::profile_conv_bwd_data_impl<1,
|
||||
ck::tensor_layout::convolution::NWC,
|
||||
ck::tensor_layout::convolution::KXC,
|
||||
ck::tensor_layout::convolution::NWK,
|
||||
ck::half_t,
|
||||
ck::half_t,
|
||||
ck::half_t>(true, // do_verification
|
||||
1, // init_method
|
||||
false, // do_log
|
||||
false, // time_kernel
|
||||
param);
|
||||
|
||||
EXPECT_TRUE(pass);
|
||||
|
||||
// bf16
|
||||
pass = ck::profiler::profile_conv_bwd_data_impl<1,
|
||||
ck::tensor_layout::convolution::NWC,
|
||||
ck::tensor_layout::convolution::KXC,
|
||||
ck::tensor_layout::convolution::NWK,
|
||||
ck::bhalf_t,
|
||||
ck::bhalf_t,
|
||||
ck::bhalf_t>(true, // do_verification
|
||||
1, // init_method
|
||||
false, // do_log
|
||||
false, // time_kernel
|
||||
param);
|
||||
|
||||
EXPECT_TRUE(pass);
|
||||
|
||||
// int8
|
||||
pass = ck::profiler::profile_conv_bwd_data_impl<1,
|
||||
ck::tensor_layout::convolution::NWC,
|
||||
ck::tensor_layout::convolution::KXC,
|
||||
ck::tensor_layout::convolution::NWK,
|
||||
int8_t,
|
||||
int8_t,
|
||||
int8_t>(true, // do_verification
|
||||
1, // init_method
|
||||
false, // do_log
|
||||
false, // time_kernel
|
||||
param);
|
||||
|
||||
EXPECT_TRUE(pass);
|
||||
}
|
||||
this->conv_params.clear();
|
||||
this->conv_params.push_back({1, 1, 128, 128, 256, {1}, {14}, {2}, {1}, {0}, {0}});
|
||||
this->conv_params.push_back({1, 1, 128, 128, 256, {3}, {28}, {1}, {1}, {1}, {1}});
|
||||
this->conv_params.push_back({1, 1, 128, 128, 256, {1}, {3}, {1}, {1}, {0}, {0}});
|
||||
this->template Run<1>();
|
||||
}
|
||||
|
||||
// 2d
|
||||
TEST_F(TestConvndBwdData, Conv2dBwdData)
|
||||
TYPED_TEST(TestConvndBwdData, Conv2dBwdData)
|
||||
{
|
||||
conv_params.clear();
|
||||
conv_params.push_back({2, 1, 128, 128, 256, {1, 1}, {7, 7}, {2, 2}, {1, 1}, {0, 0}, {0, 0}});
|
||||
conv_params.push_back({2, 1, 128, 128, 256, {3, 3}, {14, 14}, {1, 1}, {1, 1}, {1, 1}, {1, 1}});
|
||||
conv_params.push_back({2, 1, 128, 128, 256, {1, 1}, {3, 3}, {1, 1}, {1, 1}, {0, 0}, {0, 0}});
|
||||
|
||||
for(auto& param : conv_params)
|
||||
{
|
||||
bool pass;
|
||||
|
||||
// fp32
|
||||
pass = ck::profiler::profile_conv_bwd_data_impl<2,
|
||||
ck::tensor_layout::convolution::NHWC,
|
||||
ck::tensor_layout::convolution::KYXC,
|
||||
ck::tensor_layout::convolution::NHWK,
|
||||
float,
|
||||
float,
|
||||
float>(true, // do_verification
|
||||
1, // init_method
|
||||
false, // do_log
|
||||
false, // time_kernel
|
||||
param);
|
||||
|
||||
EXPECT_TRUE(pass);
|
||||
|
||||
// fp16
|
||||
pass = ck::profiler::profile_conv_bwd_data_impl<2,
|
||||
ck::tensor_layout::convolution::NHWC,
|
||||
ck::tensor_layout::convolution::KYXC,
|
||||
ck::tensor_layout::convolution::NHWK,
|
||||
ck::half_t,
|
||||
ck::half_t,
|
||||
ck::half_t>(true, // do_verification
|
||||
1, // init_method
|
||||
false, // do_log
|
||||
false, // time_kernel
|
||||
param);
|
||||
|
||||
EXPECT_TRUE(pass);
|
||||
|
||||
// bf16
|
||||
pass = ck::profiler::profile_conv_bwd_data_impl<2,
|
||||
ck::tensor_layout::convolution::NHWC,
|
||||
ck::tensor_layout::convolution::KYXC,
|
||||
ck::tensor_layout::convolution::NHWK,
|
||||
ck::bhalf_t,
|
||||
ck::bhalf_t,
|
||||
ck::bhalf_t>(true, // do_verification
|
||||
1, // init_method
|
||||
false, // do_log
|
||||
false, // time_kernel
|
||||
param);
|
||||
|
||||
EXPECT_TRUE(pass);
|
||||
|
||||
// int8
|
||||
pass = ck::profiler::profile_conv_bwd_data_impl<2,
|
||||
ck::tensor_layout::convolution::NHWC,
|
||||
ck::tensor_layout::convolution::KYXC,
|
||||
ck::tensor_layout::convolution::NHWK,
|
||||
int8_t,
|
||||
int8_t,
|
||||
int8_t>(true, // do_verification
|
||||
1, // init_method
|
||||
false, // do_log
|
||||
false, // time_kernel
|
||||
param);
|
||||
|
||||
EXPECT_TRUE(pass);
|
||||
}
|
||||
this->conv_params.clear();
|
||||
this->conv_params.push_back(
|
||||
{2, 1, 128, 128, 256, {1, 1}, {7, 7}, {2, 2}, {1, 1}, {0, 0}, {0, 0}});
|
||||
this->conv_params.push_back(
|
||||
{2, 1, 128, 128, 256, {3, 3}, {14, 14}, {1, 1}, {1, 1}, {1, 1}, {1, 1}});
|
||||
this->conv_params.push_back(
|
||||
{2, 1, 128, 128, 256, {1, 1}, {3, 3}, {1, 1}, {1, 1}, {0, 0}, {0, 0}});
|
||||
this->template Run<2>();
|
||||
}
|
||||
|
||||
// 3d
|
||||
TEST_F(TestConvndBwdData, Conv3dBwdData)
|
||||
TYPED_TEST(TestConvndBwdData, Conv3dBwdData)
|
||||
{
|
||||
conv_params.clear();
|
||||
conv_params.push_back(
|
||||
this->conv_params.clear();
|
||||
this->conv_params.push_back(
|
||||
{3, 1, 128, 128, 256, {1, 1, 1}, {7, 7, 7}, {2, 2, 2}, {1, 1, 1}, {0, 0, 0}, {0, 0, 0}});
|
||||
conv_params.push_back(
|
||||
this->conv_params.push_back(
|
||||
{3, 1, 128, 128, 256, {3, 3, 3}, {14, 14, 3}, {1, 1, 1}, {1, 1, 1}, {1, 1, 1}, {1, 1, 1}});
|
||||
conv_params.push_back(
|
||||
this->conv_params.push_back(
|
||||
{3, 1, 128, 128, 256, {1, 1, 1}, {3, 3, 3}, {1, 1, 1}, {1, 1, 1}, {0, 0, 0}, {0, 0, 0}});
|
||||
|
||||
for(auto& param : conv_params)
|
||||
{
|
||||
bool pass;
|
||||
|
||||
// fp32
|
||||
pass = ck::profiler::profile_conv_bwd_data_impl<3,
|
||||
ck::tensor_layout::convolution::NDHWC,
|
||||
ck::tensor_layout::convolution::KZYXC,
|
||||
ck::tensor_layout::convolution::NDHWK,
|
||||
float,
|
||||
float,
|
||||
float>(true, // do_verification
|
||||
1, // init_method
|
||||
false, // do_log
|
||||
false, // time_kernel
|
||||
param);
|
||||
|
||||
EXPECT_TRUE(pass);
|
||||
|
||||
// fp16
|
||||
pass = ck::profiler::profile_conv_bwd_data_impl<3,
|
||||
ck::tensor_layout::convolution::NDHWC,
|
||||
ck::tensor_layout::convolution::KZYXC,
|
||||
ck::tensor_layout::convolution::NDHWK,
|
||||
ck::half_t,
|
||||
ck::half_t,
|
||||
ck::half_t>(true, // do_verification
|
||||
1, // init_method
|
||||
false, // do_log
|
||||
false, // time_kernel
|
||||
param);
|
||||
|
||||
EXPECT_TRUE(pass);
|
||||
|
||||
// bf16
|
||||
pass = ck::profiler::profile_conv_bwd_data_impl<3,
|
||||
ck::tensor_layout::convolution::NDHWC,
|
||||
ck::tensor_layout::convolution::KZYXC,
|
||||
ck::tensor_layout::convolution::NDHWK,
|
||||
ck::bhalf_t,
|
||||
ck::bhalf_t,
|
||||
ck::bhalf_t>(true, // do_verification
|
||||
1, // init_method
|
||||
false, // do_log
|
||||
false, // time_kernel
|
||||
param);
|
||||
|
||||
EXPECT_TRUE(pass);
|
||||
|
||||
// int8
|
||||
pass = ck::profiler::profile_conv_bwd_data_impl<3,
|
||||
ck::tensor_layout::convolution::NDHWC,
|
||||
ck::tensor_layout::convolution::KZYXC,
|
||||
ck::tensor_layout::convolution::NDHWK,
|
||||
int8_t,
|
||||
int8_t,
|
||||
int8_t>(true, // do_verification
|
||||
1, // init_method
|
||||
false, // do_log
|
||||
false, // time_kernel
|
||||
param);
|
||||
|
||||
EXPECT_TRUE(pass);
|
||||
}
|
||||
this->template Run<3>();
|
||||
}
|
||||
|
||||
@@ -5,201 +5,86 @@
|
||||
#include <iostream>
|
||||
#include <initializer_list>
|
||||
#include <vector>
|
||||
#include <tuple>
|
||||
#include <gtest/gtest.h>
|
||||
|
||||
#include "profiler/include/profile_conv_bwd_weight_impl.hpp"
|
||||
|
||||
template <typename Tuple>
|
||||
class TestConvndBwdWeight : public ::testing::Test
|
||||
{
|
||||
protected:
|
||||
using DataType = std::tuple_element_t<0, Tuple>;
|
||||
std::vector<ck::utils::conv::ConvParam> conv_params;
|
||||
ck::index_t split_k{2};
|
||||
|
||||
template <ck::index_t NDimSpatial>
|
||||
void Run()
|
||||
{
|
||||
for(auto& param : conv_params)
|
||||
{
|
||||
bool pass;
|
||||
EXPECT_FALSE(conv_params.empty());
|
||||
pass = ck::profiler::profile_conv_bwd_weight_impl<
|
||||
NDimSpatial,
|
||||
ck::tuple_element_t<NDimSpatial - 1,
|
||||
ck::Tuple<ck::tensor_layout::convolution::NWC,
|
||||
ck::tensor_layout::convolution::NHWC,
|
||||
ck::tensor_layout::convolution::NDHWC>>,
|
||||
ck::tuple_element_t<NDimSpatial - 1,
|
||||
ck::Tuple<ck::tensor_layout::convolution::KXC,
|
||||
ck::tensor_layout::convolution::KYXC,
|
||||
ck::tensor_layout::convolution::KZYXC>>,
|
||||
ck::tuple_element_t<NDimSpatial - 1,
|
||||
ck::Tuple<ck::tensor_layout::convolution::NWK,
|
||||
ck::tensor_layout::convolution::NHWK,
|
||||
ck::tensor_layout::convolution::NDHWK>>,
|
||||
DataType,
|
||||
DataType,
|
||||
DataType>(true, // do_verification
|
||||
1, // init_method integer value
|
||||
false, // do_log
|
||||
false, // time_kernel
|
||||
param,
|
||||
split_k);
|
||||
EXPECT_TRUE(pass);
|
||||
}
|
||||
}
|
||||
};
|
||||
|
||||
// 1d
|
||||
TEST_F(TestConvndBwdWeight, Conv1dBwdWeight)
|
||||
using KernelTypes =
|
||||
::testing::Types<std::tuple<float>, std::tuple<ck::half_t>, std::tuple<ck::bhalf_t>>;
|
||||
TYPED_TEST_SUITE(TestConvndBwdWeight, KernelTypes);
|
||||
|
||||
TYPED_TEST(TestConvndBwdWeight, Test1D)
|
||||
{
|
||||
conv_params.clear();
|
||||
conv_params.push_back({1, 1, 128, 128, 256, {1}, {14}, {2}, {1}, {0}, {0}});
|
||||
conv_params.push_back({1, 1, 128, 128, 256, {3}, {28}, {1}, {1}, {1}, {1}});
|
||||
conv_params.push_back({1, 1, 128, 128, 256, {1}, {3}, {1}, {1}, {0}, {0}});
|
||||
|
||||
for(auto& param : conv_params)
|
||||
{
|
||||
bool pass;
|
||||
|
||||
// fp32
|
||||
pass = ck::profiler::profile_conv_bwd_weight_impl<1,
|
||||
ck::tensor_layout::convolution::NWC,
|
||||
ck::tensor_layout::convolution::KXC,
|
||||
ck::tensor_layout::convolution::NWK,
|
||||
float,
|
||||
float,
|
||||
float>(true, // do_verification
|
||||
1, // init_method
|
||||
false, // do_log
|
||||
false, // time_kernel
|
||||
param,
|
||||
2);
|
||||
|
||||
EXPECT_TRUE(pass);
|
||||
|
||||
// fp16
|
||||
pass = ck::profiler::profile_conv_bwd_weight_impl<1,
|
||||
ck::tensor_layout::convolution::NWC,
|
||||
ck::tensor_layout::convolution::KXC,
|
||||
ck::tensor_layout::convolution::NWK,
|
||||
ck::half_t,
|
||||
ck::half_t,
|
||||
ck::half_t>(true, // do_verification
|
||||
1, // init_method
|
||||
false, // do_log
|
||||
false, // time_kernel
|
||||
param,
|
||||
2);
|
||||
|
||||
EXPECT_TRUE(pass);
|
||||
|
||||
// bf16
|
||||
pass = ck::profiler::profile_conv_bwd_weight_impl<1,
|
||||
ck::tensor_layout::convolution::NWC,
|
||||
ck::tensor_layout::convolution::KXC,
|
||||
ck::tensor_layout::convolution::NWK,
|
||||
ck::bhalf_t,
|
||||
ck::bhalf_t,
|
||||
ck::bhalf_t>(true, // do_verification
|
||||
1, // init_method
|
||||
false, // do_log
|
||||
false, // time_kernel
|
||||
param,
|
||||
2);
|
||||
|
||||
EXPECT_TRUE(pass);
|
||||
}
|
||||
this->conv_params.clear();
|
||||
this->conv_params.push_back({1, 1, 128, 128, 256, {1}, {14}, {2}, {1}, {0}, {0}});
|
||||
this->conv_params.push_back({1, 1, 128, 128, 256, {3}, {28}, {1}, {1}, {1}, {1}});
|
||||
this->conv_params.push_back({1, 1, 128, 128, 256, {1}, {3}, {1}, {1}, {0}, {0}});
|
||||
this->template Run<1>();
|
||||
}
|
||||
|
||||
// 2d
|
||||
TEST_F(TestConvndBwdWeight, Conv2dBwdWeight)
|
||||
TYPED_TEST(TestConvndBwdWeight, Test2D)
|
||||
{
|
||||
conv_params.clear();
|
||||
conv_params.push_back({2, 1, 128, 128, 256, {1, 1}, {7, 7}, {2, 2}, {1, 1}, {0, 0}, {0, 0}});
|
||||
conv_params.push_back({2, 1, 32, 128, 256, {3, 3}, {14, 14}, {1, 1}, {1, 1}, {1, 1}, {1, 1}});
|
||||
conv_params.push_back({2, 1, 128, 128, 256, {1, 1}, {3, 3}, {1, 1}, {1, 1}, {0, 0}, {0, 0}});
|
||||
|
||||
for(auto& param : conv_params)
|
||||
{
|
||||
bool pass;
|
||||
|
||||
// fp32
|
||||
pass = ck::profiler::profile_conv_bwd_weight_impl<2,
|
||||
ck::tensor_layout::convolution::NHWC,
|
||||
ck::tensor_layout::convolution::KYXC,
|
||||
ck::tensor_layout::convolution::NHWK,
|
||||
float,
|
||||
float,
|
||||
float>(true, // do_verification
|
||||
1, // init_method
|
||||
false, // do_log
|
||||
false, // time_kernel
|
||||
param,
|
||||
2);
|
||||
|
||||
EXPECT_TRUE(pass);
|
||||
|
||||
// fp16
|
||||
pass = ck::profiler::profile_conv_bwd_weight_impl<2,
|
||||
ck::tensor_layout::convolution::NHWC,
|
||||
ck::tensor_layout::convolution::KYXC,
|
||||
ck::tensor_layout::convolution::NHWK,
|
||||
ck::half_t,
|
||||
ck::half_t,
|
||||
ck::half_t>(true, // do_verification
|
||||
1, // init_method
|
||||
false, // do_log
|
||||
false, // time_kernel
|
||||
param,
|
||||
2);
|
||||
|
||||
EXPECT_TRUE(pass);
|
||||
|
||||
// bf16
|
||||
pass = ck::profiler::profile_conv_bwd_weight_impl<2,
|
||||
ck::tensor_layout::convolution::NHWC,
|
||||
ck::tensor_layout::convolution::KYXC,
|
||||
ck::tensor_layout::convolution::NHWK,
|
||||
ck::bhalf_t,
|
||||
ck::bhalf_t,
|
||||
ck::bhalf_t>(true, // do_verification
|
||||
1, // init_method
|
||||
false, // do_log
|
||||
false, // time_kernel
|
||||
param,
|
||||
2);
|
||||
|
||||
EXPECT_TRUE(pass);
|
||||
}
|
||||
this->conv_params.clear();
|
||||
this->conv_params.push_back(
|
||||
{2, 1, 128, 128, 256, {1, 1}, {7, 7}, {2, 2}, {1, 1}, {0, 0}, {0, 0}});
|
||||
this->conv_params.push_back(
|
||||
{2, 1, 32, 128, 256, {3, 3}, {14, 14}, {1, 1}, {1, 1}, {1, 1}, {1, 1}});
|
||||
this->conv_params.push_back(
|
||||
{2, 1, 128, 128, 256, {1, 1}, {3, 3}, {1, 1}, {1, 1}, {0, 0}, {0, 0}});
|
||||
this->template Run<2>();
|
||||
}
|
||||
|
||||
// 3d
|
||||
TEST_F(TestConvndBwdWeight, Conv3dBwdWeight)
|
||||
TYPED_TEST(TestConvndBwdWeight, Test3D)
|
||||
{
|
||||
conv_params.clear();
|
||||
conv_params.push_back(
|
||||
this->conv_params.clear();
|
||||
this->conv_params.push_back(
|
||||
{3, 1, 128, 128, 256, {1, 1, 1}, {7, 7, 7}, {2, 2, 2}, {1, 1, 1}, {0, 0, 0}, {0, 0, 0}});
|
||||
conv_params.push_back(
|
||||
this->conv_params.push_back(
|
||||
{3, 1, 32, 128, 256, {3, 3, 3}, {14, 14, 3}, {1, 1, 1}, {1, 1, 1}, {1, 1, 1}, {1, 1, 1}});
|
||||
conv_params.push_back(
|
||||
this->conv_params.push_back(
|
||||
{3, 1, 128, 128, 256, {1, 1, 1}, {3, 3, 3}, {1, 1, 1}, {1, 1, 1}, {0, 0, 0}, {0, 0, 0}});
|
||||
|
||||
for(auto& param : conv_params)
|
||||
{
|
||||
bool pass;
|
||||
|
||||
// fp32
|
||||
pass = ck::profiler::profile_conv_bwd_weight_impl<3,
|
||||
ck::tensor_layout::convolution::NDHWC,
|
||||
ck::tensor_layout::convolution::KZYXC,
|
||||
ck::tensor_layout::convolution::NDHWK,
|
||||
float,
|
||||
float,
|
||||
float>(true, // do_verification
|
||||
1, // init_method
|
||||
false, // do_log
|
||||
false, // time_kernel
|
||||
param,
|
||||
2);
|
||||
|
||||
EXPECT_TRUE(pass);
|
||||
|
||||
// fp16
|
||||
pass = ck::profiler::profile_conv_bwd_weight_impl<3,
|
||||
ck::tensor_layout::convolution::NDHWC,
|
||||
ck::tensor_layout::convolution::KZYXC,
|
||||
ck::tensor_layout::convolution::NDHWK,
|
||||
ck::half_t,
|
||||
ck::half_t,
|
||||
ck::half_t>(true, // do_verification
|
||||
1, // init_method
|
||||
false, // do_log
|
||||
false, // time_kernel
|
||||
param,
|
||||
2);
|
||||
|
||||
EXPECT_TRUE(pass);
|
||||
|
||||
// bf16
|
||||
pass = ck::profiler::profile_conv_bwd_weight_impl<3,
|
||||
ck::tensor_layout::convolution::NDHWC,
|
||||
ck::tensor_layout::convolution::KZYXC,
|
||||
ck::tensor_layout::convolution::NDHWK,
|
||||
ck::bhalf_t,
|
||||
ck::bhalf_t,
|
||||
ck::bhalf_t>(true, // do_verification
|
||||
1, // init_method
|
||||
false, // do_log
|
||||
false, // time_kernel
|
||||
param,
|
||||
2);
|
||||
|
||||
EXPECT_TRUE(pass);
|
||||
}
|
||||
this->template Run<3>();
|
||||
}
|
||||
|
||||
@@ -5,237 +5,88 @@
|
||||
#include <iostream>
|
||||
#include <initializer_list>
|
||||
#include <vector>
|
||||
#include <tuple>
|
||||
#include <gtest/gtest.h>
|
||||
|
||||
#include "profiler/include/profile_conv_fwd_impl.hpp"
|
||||
|
||||
template <typename Tuple>
|
||||
class TestConvndFwd : public ::testing::Test
|
||||
{
|
||||
protected:
|
||||
using DataType = std::tuple_element_t<0, Tuple>;
|
||||
std::vector<ck::utils::conv::ConvParam> conv_params;
|
||||
|
||||
template <ck::index_t NDimSpatial>
|
||||
void Run()
|
||||
{
|
||||
for(auto& param : conv_params)
|
||||
{
|
||||
bool pass;
|
||||
EXPECT_FALSE(conv_params.empty());
|
||||
pass = ck::profiler::profile_conv_fwd_impl<
|
||||
NDimSpatial,
|
||||
ck::tuple_element_t<NDimSpatial - 1,
|
||||
ck::Tuple<ck::tensor_layout::convolution::NWC,
|
||||
ck::tensor_layout::convolution::NHWC,
|
||||
ck::tensor_layout::convolution::NDHWC>>,
|
||||
ck::tuple_element_t<NDimSpatial - 1,
|
||||
ck::Tuple<ck::tensor_layout::convolution::KXC,
|
||||
ck::tensor_layout::convolution::KYXC,
|
||||
ck::tensor_layout::convolution::KZYXC>>,
|
||||
ck::tuple_element_t<NDimSpatial - 1,
|
||||
ck::Tuple<ck::tensor_layout::convolution::NWK,
|
||||
ck::tensor_layout::convolution::NHWK,
|
||||
ck::tensor_layout::convolution::NDHWK>>,
|
||||
DataType,
|
||||
DataType,
|
||||
DataType>(true, // do_verification
|
||||
1, // init_method integer value
|
||||
false, // do_log
|
||||
false, // time_kernel
|
||||
param);
|
||||
EXPECT_TRUE(pass);
|
||||
}
|
||||
}
|
||||
};
|
||||
|
||||
using KernelTypes = ::testing::Types<std::tuple<float>,
|
||||
std::tuple<ck::half_t>,
|
||||
std::tuple<ck::bhalf_t>,
|
||||
std::tuple<std::int8_t>>;
|
||||
TYPED_TEST_SUITE(TestConvndFwd, KernelTypes);
|
||||
|
||||
// 1d
|
||||
TEST_F(TestConvndFwd, Conv1dFwd)
|
||||
TYPED_TEST(TestConvndFwd, Conv1dFwd)
|
||||
{
|
||||
conv_params.clear();
|
||||
conv_params.push_back({1, 1, 128, 128, 256, {1}, {14}, {2}, {1}, {0}, {0}});
|
||||
conv_params.push_back({1, 1, 128, 128, 256, {3}, {28}, {1}, {1}, {1}, {1}});
|
||||
conv_params.push_back({1, 1, 128, 128, 256, {1}, {3}, {1}, {1}, {0}, {0}});
|
||||
|
||||
for(auto& param : conv_params)
|
||||
{
|
||||
bool pass;
|
||||
|
||||
// fp32
|
||||
pass = ck::profiler::profile_conv_fwd_impl<1,
|
||||
ck::tensor_layout::convolution::NWC,
|
||||
ck::tensor_layout::convolution::KXC,
|
||||
ck::tensor_layout::convolution::NWK,
|
||||
float,
|
||||
float,
|
||||
float>(true, // do_verification
|
||||
1, // init_method
|
||||
false, // do_log
|
||||
false, // time_kernel
|
||||
param);
|
||||
|
||||
EXPECT_TRUE(pass);
|
||||
|
||||
// fp16
|
||||
pass = ck::profiler::profile_conv_fwd_impl<1,
|
||||
ck::tensor_layout::convolution::NWC,
|
||||
ck::tensor_layout::convolution::KXC,
|
||||
ck::tensor_layout::convolution::NWK,
|
||||
ck::half_t,
|
||||
ck::half_t,
|
||||
ck::half_t>(true, // do_verification
|
||||
1, // init_method
|
||||
false, // do_log
|
||||
false, // time_kernel
|
||||
param);
|
||||
|
||||
EXPECT_TRUE(pass);
|
||||
|
||||
// bf16
|
||||
pass = ck::profiler::profile_conv_fwd_impl<1,
|
||||
ck::tensor_layout::convolution::NWC,
|
||||
ck::tensor_layout::convolution::KXC,
|
||||
ck::tensor_layout::convolution::NWK,
|
||||
ck::bhalf_t,
|
||||
ck::bhalf_t,
|
||||
ck::bhalf_t>(true, // do_verification
|
||||
1, // init_method
|
||||
false, // do_log
|
||||
false, // time_kernel
|
||||
param);
|
||||
|
||||
EXPECT_TRUE(pass);
|
||||
|
||||
// int8
|
||||
pass = ck::profiler::profile_conv_fwd_impl<1,
|
||||
ck::tensor_layout::convolution::NWC,
|
||||
ck::tensor_layout::convolution::KXC,
|
||||
ck::tensor_layout::convolution::NWK,
|
||||
int8_t,
|
||||
int8_t,
|
||||
int8_t>(true, // do_verification
|
||||
1, // init_method
|
||||
false, // do_log
|
||||
false, // time_kernel
|
||||
param);
|
||||
|
||||
EXPECT_TRUE(pass);
|
||||
}
|
||||
this->conv_params.clear();
|
||||
this->conv_params.push_back({1, 1, 128, 128, 256, {1}, {14}, {2}, {1}, {0}, {0}});
|
||||
this->conv_params.push_back({1, 1, 128, 128, 256, {3}, {28}, {1}, {1}, {1}, {1}});
|
||||
this->conv_params.push_back({1, 1, 128, 128, 256, {1}, {3}, {1}, {1}, {0}, {0}});
|
||||
this->template Run<1>();
|
||||
}
|
||||
|
||||
// 2d
|
||||
TEST_F(TestConvndFwd, Conv2dFwd)
|
||||
TYPED_TEST(TestConvndFwd, Conv2dFwd)
|
||||
{
|
||||
conv_params.clear();
|
||||
conv_params.push_back({2, 1, 128, 128, 256, {1, 1}, {7, 7}, {2, 2}, {1, 1}, {0, 0}, {0, 0}});
|
||||
conv_params.push_back({2, 1, 128, 128, 256, {3, 3}, {14, 14}, {1, 1}, {1, 1}, {1, 1}, {1, 1}});
|
||||
conv_params.push_back({2, 1, 128, 128, 256, {1, 1}, {3, 3}, {1, 1}, {1, 1}, {0, 0}, {0, 0}});
|
||||
|
||||
for(auto& param : conv_params)
|
||||
{
|
||||
bool pass;
|
||||
|
||||
// fp32
|
||||
pass = ck::profiler::profile_conv_fwd_impl<2,
|
||||
ck::tensor_layout::convolution::NHWC,
|
||||
ck::tensor_layout::convolution::KYXC,
|
||||
ck::tensor_layout::convolution::NHWK,
|
||||
float,
|
||||
float,
|
||||
float>(true, // do_verification
|
||||
1, // init_method
|
||||
false, // do_log
|
||||
false, // time_kernel
|
||||
param);
|
||||
|
||||
EXPECT_TRUE(pass);
|
||||
|
||||
// fp16
|
||||
pass = ck::profiler::profile_conv_fwd_impl<2,
|
||||
ck::tensor_layout::convolution::NHWC,
|
||||
ck::tensor_layout::convolution::KYXC,
|
||||
ck::tensor_layout::convolution::NHWK,
|
||||
ck::half_t,
|
||||
ck::half_t,
|
||||
ck::half_t>(true, // do_verification
|
||||
1, // init_method
|
||||
false, // do_log
|
||||
false, // time_kernel
|
||||
param);
|
||||
|
||||
EXPECT_TRUE(pass);
|
||||
|
||||
// bf16
|
||||
pass = ck::profiler::profile_conv_fwd_impl<2,
|
||||
ck::tensor_layout::convolution::NHWC,
|
||||
ck::tensor_layout::convolution::KYXC,
|
||||
ck::tensor_layout::convolution::NHWK,
|
||||
ck::bhalf_t,
|
||||
ck::bhalf_t,
|
||||
ck::bhalf_t>(true, // do_verification
|
||||
1, // init_method
|
||||
false, // do_log
|
||||
false, // time_kernel
|
||||
param);
|
||||
|
||||
EXPECT_TRUE(pass);
|
||||
|
||||
// int8
|
||||
pass = ck::profiler::profile_conv_fwd_impl<2,
|
||||
ck::tensor_layout::convolution::NHWC,
|
||||
ck::tensor_layout::convolution::KYXC,
|
||||
ck::tensor_layout::convolution::NHWK,
|
||||
int8_t,
|
||||
int8_t,
|
||||
int8_t>(true, // do_verification
|
||||
1, // init_method
|
||||
false, // do_log
|
||||
false, // time_kernel
|
||||
param);
|
||||
|
||||
EXPECT_TRUE(pass);
|
||||
}
|
||||
this->conv_params.clear();
|
||||
this->conv_params.push_back(
|
||||
{2, 1, 128, 128, 256, {1, 1}, {7, 7}, {2, 2}, {1, 1}, {0, 0}, {0, 0}});
|
||||
this->conv_params.push_back(
|
||||
{2, 1, 128, 128, 256, {3, 3}, {14, 14}, {1, 1}, {1, 1}, {1, 1}, {1, 1}});
|
||||
this->conv_params.push_back(
|
||||
{2, 1, 128, 128, 256, {1, 1}, {3, 3}, {1, 1}, {1, 1}, {0, 0}, {0, 0}});
|
||||
this->template Run<2>();
|
||||
}
|
||||
|
||||
// 3d
|
||||
TEST_F(TestConvndFwd, Conv3dFwd)
|
||||
TYPED_TEST(TestConvndFwd, Conv3dFwd)
|
||||
{
|
||||
conv_params.clear();
|
||||
conv_params.push_back(
|
||||
this->conv_params.clear();
|
||||
this->conv_params.push_back(
|
||||
{3, 1, 128, 128, 256, {1, 1, 1}, {7, 7, 7}, {2, 2, 2}, {1, 1, 1}, {0, 0, 0}, {0, 0, 0}});
|
||||
conv_params.push_back(
|
||||
this->conv_params.push_back(
|
||||
{3, 1, 128, 128, 256, {3, 3, 3}, {14, 14, 3}, {1, 1, 1}, {1, 1, 1}, {1, 1, 1}, {1, 1, 1}});
|
||||
conv_params.push_back(
|
||||
this->conv_params.push_back(
|
||||
{3, 1, 128, 128, 256, {1, 1, 1}, {3, 3, 3}, {1, 1, 1}, {1, 1, 1}, {0, 0, 0}, {0, 0, 0}});
|
||||
|
||||
for(auto& param : conv_params)
|
||||
{
|
||||
bool pass;
|
||||
|
||||
// fp32
|
||||
pass = ck::profiler::profile_conv_fwd_impl<3,
|
||||
ck::tensor_layout::convolution::NDHWC,
|
||||
ck::tensor_layout::convolution::KZYXC,
|
||||
ck::tensor_layout::convolution::NDHWK,
|
||||
float,
|
||||
float,
|
||||
float>(true, // do_verification
|
||||
1, // init_method
|
||||
false, // do_log
|
||||
false, // time_kernel
|
||||
param);
|
||||
|
||||
EXPECT_TRUE(pass);
|
||||
|
||||
// fp16
|
||||
pass = ck::profiler::profile_conv_fwd_impl<3,
|
||||
ck::tensor_layout::convolution::NDHWC,
|
||||
ck::tensor_layout::convolution::KZYXC,
|
||||
ck::tensor_layout::convolution::NDHWK,
|
||||
ck::half_t,
|
||||
ck::half_t,
|
||||
ck::half_t>(true, // do_verification
|
||||
1, // init_method
|
||||
false, // do_log
|
||||
false, // time_kernel
|
||||
param);
|
||||
|
||||
EXPECT_TRUE(pass);
|
||||
|
||||
// bf16
|
||||
pass = ck::profiler::profile_conv_fwd_impl<3,
|
||||
ck::tensor_layout::convolution::NDHWC,
|
||||
ck::tensor_layout::convolution::KZYXC,
|
||||
ck::tensor_layout::convolution::NDHWK,
|
||||
ck::bhalf_t,
|
||||
ck::bhalf_t,
|
||||
ck::bhalf_t>(true, // do_verification
|
||||
1, // init_method
|
||||
false, // do_log
|
||||
false, // time_kernel
|
||||
param);
|
||||
|
||||
EXPECT_TRUE(pass);
|
||||
|
||||
// int8
|
||||
pass = ck::profiler::profile_conv_fwd_impl<3,
|
||||
ck::tensor_layout::convolution::NDHWC,
|
||||
ck::tensor_layout::convolution::KZYXC,
|
||||
ck::tensor_layout::convolution::NDHWK,
|
||||
int8_t,
|
||||
int8_t,
|
||||
int8_t>(true, // do_verification
|
||||
1, // init_method
|
||||
false, // do_log
|
||||
false, // time_kernel
|
||||
param);
|
||||
|
||||
EXPECT_TRUE(pass);
|
||||
}
|
||||
this->template Run<3>();
|
||||
}
|
||||
|
||||
@@ -9,7 +9,7 @@
|
||||
|
||||
#include "ck/ck.hpp"
|
||||
#include "ck/utility/number.hpp"
|
||||
#include "ck/tensor_operation/gpu/device/device_normalization_impl.hpp"
|
||||
#include "ck/tensor_operation/gpu/device/impl/device_normalization_impl.hpp"
|
||||
|
||||
#include "ck/library/utility/check_err.hpp"
|
||||
#include "ck/library/utility/host_tensor.hpp"
|
||||
|
||||
Reference in New Issue
Block a user