mirror of
https://github.com/ROCm/composable_kernel.git
synced 2026-05-20 21:09:08 +00:00
MaxPool & AvgPool bwd instances, test, ckProfiler, client example (#861)
* Add maxpool instances
* Rename index pool to max pool.
* Add maxpool bwd bf16 instances
* Add avg pool bwd instances
* Rename avgpool and maxpool to avg_pool3d and max_pool
* Add bf16 pool fwd instances
* Add max pool bwd to ckProfiler
* Add avg pool3d bwd to ckProfiler
* Add avg pool bwd test
* Fix bug of reference pool fwd (dilation)
* Fix bug of max pool bwd (dilation and initZero)
* Support bf16 compute data type
* Force the compute type to be f32, because atomicAdd only supports f32
* Add max pool bwd test
* Rename folder
* Rename pool
* Add max pool bwd client example
* Add avg pool bwd client example
* Add missing workspace
* clang format
* Rename macro
* remove useless header
* remove useless layout
[ROCm/composable_kernel commit: 866377de18]
This commit is contained in:
@@ -57,7 +57,7 @@ add_subdirectory(data_type)
|
||||
add_subdirectory(elementwise_normalization)
|
||||
add_subdirectory(batchnorm)
|
||||
add_subdirectory(contraction)
|
||||
add_subdirectory(pool_fwd)
|
||||
add_subdirectory(pool)
|
||||
add_subdirectory(batched_gemm_multi_d)
|
||||
add_subdirectory(grouped_convnd_bwd_data)
|
||||
if(GPU_TARGETS MATCHES "gfx11")
|
||||
|
||||
16
test/pool/CMakeLists.txt
Normal file
16
test/pool/CMakeLists.txt
Normal file
@@ -0,0 +1,16 @@
|
||||
# Umbrella target: building `test_pool` builds every pooling test executable
# registered below.
add_custom_target(test_pool)

# 3D average pooling, backward pass.
add_gtest_executable(test_avg_pool3d_bwd test_avg_pool3d_bwd.cpp)
target_link_libraries(test_avg_pool3d_bwd PRIVATE utility device_avg_pool3d_bwd_instance)
add_dependencies(test_pool test_avg_pool3d_bwd)

# 3D max pooling, backward pass.
add_gtest_executable(test_max_pool3d_bwd test_max_pool3d_bwd.cpp)
target_link_libraries(test_max_pool3d_bwd PRIVATE utility device_max_pool_bwd_instance)
add_dependencies(test_pool test_max_pool3d_bwd)

# 3D average pooling, forward pass (shares the forward instance library with max pooling).
add_gtest_executable(test_avg_pool3d_fwd test_avg_pool3d_fwd.cpp)
target_link_libraries(test_avg_pool3d_fwd PRIVATE utility device_pool3d_fwd_instance)
add_dependencies(test_pool test_avg_pool3d_fwd)

# 3D max pooling, forward pass.
add_gtest_executable(test_max_pool3d_fwd test_max_pool3d_fwd.cpp)
target_link_libraries(test_max_pool3d_fwd PRIVATE utility device_pool3d_fwd_instance)
add_dependencies(test_pool test_max_pool3d_fwd)
|
||||
74
test/pool/test_avg_pool3d_bwd.cpp
Normal file
74
test/pool/test_avg_pool3d_bwd.cpp
Normal file
@@ -0,0 +1,74 @@
|
||||
// SPDX-License-Identifier: MIT
|
||||
// Copyright (c) 2018-2023, Advanced Micro Devices, Inc. All rights reserved.
|
||||
|
||||
#include "gtest/gtest.h"
|
||||
#include "profiler/profile_avg_pool3d_bwd_impl.hpp"
|
||||
#include "test_pool_fwd_common.hpp"
|
||||
|
||||
template <typename Tuple>
|
||||
class TestAvgPool3dBwd : public ::testing::Test
|
||||
{
|
||||
protected:
|
||||
using DOutDataType = std::tuple_element_t<0, Tuple>;
|
||||
using DInDataType = std::tuple_element_t<1, Tuple>;
|
||||
using ComputeDataType = std::tuple_element_t<2, Tuple>;
|
||||
using DOutLayout = std::tuple_element_t<3, Tuple>;
|
||||
using DInLayout = std::tuple_element_t<4, Tuple>;
|
||||
|
||||
std::vector<PoolingParam> params;
|
||||
|
||||
void Run()
|
||||
{
|
||||
for(auto param : params)
|
||||
{
|
||||
bool success =
|
||||
ck::profiler::profile_avg_pool3d_bwd_impl<DOutDataType,
|
||||
DInDataType,
|
||||
ComputeDataType,
|
||||
DOutLayout,
|
||||
DInLayout>(true,
|
||||
2,
|
||||
false,
|
||||
false,
|
||||
param.length_,
|
||||
param.window_spatial_lengths_,
|
||||
param.window_strides_,
|
||||
param.window_dilations_,
|
||||
param.input_left_pads_,
|
||||
param.input_right_pads_);
|
||||
EXPECT_TRUE(success);
|
||||
}
|
||||
}
|
||||
};
|
||||
|
||||
#if defined(CK_ENABLE_FP16) && defined(CK_ENABLE_BF16) && defined(CK_ENABLE_FP32)
|
||||
using KernelTypes = ::testing::Types<std::tuple<F16, F16, F32, NDHWC, NDHWC>,
|
||||
std::tuple<BF16, BF16, F32, NDHWC, NDHWC>,
|
||||
std::tuple<F32, F32, F32, NDHWC, NDHWC>>;
|
||||
#elif defined(CK_ENABLE_FP16) && defined(CK_ENABLE_FP32)
|
||||
using KernelTypes = ::testing::Types<std::tuple<F16, F16, F32, NDHWC, NDHWC>,
|
||||
std::tuple<F32, F32, F32, NDHWC, NDHWC>>;
|
||||
#elif defined(CK_ENABLE_BF16) && defined(CK_ENABLE_FP32)
|
||||
using KernelTypes = ::testing::Types<std::tuple<BF16, BF16, F32, NDHWC, NDHWC>,
|
||||
std::tuple<F32, F32, F32, NDHWC, NDHWC>>;
|
||||
#elif defined(CK_ENABLE_FP16) && defined(CK_ENABLE_BF16)
|
||||
using KernelTypes = ::testing::Types<std::tuple<F16, F16, F32, NDHWC, NDHWC>,
|
||||
std::tuple<BF16, BF16, F32, NDHWC, NDHWC>>;
|
||||
#elif defined(CK_ENABLE_FP16)
|
||||
using KernelTypes = ::testing::Types<std::tuple<F16, F16, F32, NDHWC, NDHWC>>;
|
||||
#elif defined(CK_ENABLE_BF16)
|
||||
using KernelTypes = ::testing::Types<std::tuple<BF16, BF16, F32, NDHWC, NDHWC>>;
|
||||
#elif defined(CK_ENABLE_FP32)
|
||||
using KernelTypes = ::testing::Types<std::tuple<F32, F32, F32, NDHWC, NDHWC>>;
|
||||
#endif
|
||||
|
||||
TYPED_TEST_SUITE(TestAvgPool3dBwd, KernelTypes);

// Runs the avg-pool3d backward fixture over three pooling configurations for every type
// tuple in KernelTypes.
TYPED_TEST(TestAvgPool3dBwd, Test_Pool)
{
    // Field order of each entry:
    // length, window_length, window_stride, window_dilation, left_pad, right_pad
    const std::vector<PoolingParam> pool_cases = {
        // every length entry is 1; 1x1x1 window, unit stride and dilation, no padding
        {{1, 1, 1, 1, 1}, {1, 1, 1}, {1, 1, 1}, {1, 1, 1}, {0, 0, 0}, {0, 0, 0}},
        // 4x4x4 window, stride 4, dilation 2, no padding
        {{2, 16, 64, 64, 64}, {4, 4, 4}, {4, 4, 4}, {2, 2, 2}, {0, 0, 0}, {0, 0, 0}},
        // 2x2x2 window, stride 2, unit dilation, padding of 1 on both sides
        {{2, 32, 30, 30, 30}, {2, 2, 2}, {2, 2, 2}, {1, 1, 1}, {1, 1, 1}, {1, 1, 1}},
    };

    this->params = pool_cases;
    this->Run();
}
|
||||
79
test/pool/test_max_pool3d_bwd.cpp
Normal file
79
test/pool/test_max_pool3d_bwd.cpp
Normal file
@@ -0,0 +1,79 @@
|
||||
// SPDX-License-Identifier: MIT
|
||||
// Copyright (c) 2018-2023, Advanced Micro Devices, Inc. All rights reserved.
|
||||
|
||||
#include "gtest/gtest.h"
|
||||
#include "profiler/profile_max_pool3d_bwd_impl.hpp"
|
||||
#include "test_pool_fwd_common.hpp"
|
||||
|
||||
template <typename Tuple>
|
||||
class TestMaxPool3dBwd : public ::testing::Test
|
||||
{
|
||||
protected:
|
||||
using DOutDataType = std::tuple_element_t<0, Tuple>;
|
||||
using DInDataType = std::tuple_element_t<1, Tuple>;
|
||||
using IndexDataType = std::tuple_element_t<2, Tuple>;
|
||||
|
||||
using InDataType = DInDataType;
|
||||
using OutDataType = DOutDataType;
|
||||
|
||||
std::vector<PoolingParam> params;
|
||||
|
||||
void Run()
|
||||
{
|
||||
for(auto param : params)
|
||||
{
|
||||
bool success =
|
||||
ck::profiler::profile_max_pool3d_bwd_impl<InDataType,
|
||||
OutDataType,
|
||||
IndexDataType,
|
||||
DOutDataType,
|
||||
DInDataType,
|
||||
false>(true,
|
||||
2,
|
||||
false,
|
||||
false,
|
||||
param.length_,
|
||||
param.window_spatial_lengths_,
|
||||
param.window_strides_,
|
||||
param.window_dilations_,
|
||||
param.input_left_pads_,
|
||||
param.input_right_pads_);
|
||||
EXPECT_TRUE(success);
|
||||
}
|
||||
}
|
||||
};
|
||||
|
||||
#if defined(CK_ENABLE_FP16) && defined(CK_ENABLE_BF16) && defined(CK_ENABLE_FP32)
|
||||
using KernelTypes = ::testing::Types<std::tuple<F16, F16, I32, NDHWC, NDHWC>,
|
||||
std::tuple<BF16, BF16, I32, NDHWC, NDHWC>,
|
||||
std::tuple<F32, F32, I32, NDHWC, NDHWC>>;
|
||||
#elif defined(CK_ENABLE_FP16) && defined(CK_ENABLE_FP32)
|
||||
using KernelTypes = ::testing::Types<std::tuple<F16, F16, I32, NDHWC, NDHWC>,
|
||||
std::tuple<F32, F32, I32, NDHWC, NDHWC>>;
|
||||
#elif defined(CK_ENABLE_BF16) && defined(CK_ENABLE_FP32)
|
||||
using KernelTypes = ::testing::Types<std::tuple<BF16, BF16, I32, NDHWC, NDHWC>,
|
||||
std::tuple<F32, F32, I32, NDHWC, NDHWC>>;
|
||||
#elif defined(CK_ENABLE_FP16) && defined(CK_ENABLE_BF16)
|
||||
using KernelTypes = ::testing::Types<std::tuple<F16, F16, I32, NDHWC, NDHWC>,
|
||||
std::tuple<BF16, BF16, I32, NDHWC, NDHWC>>;
|
||||
#elif defined(CK_ENABLE_FP16)
|
||||
using KernelTypes = ::testing::Types<std::tuple<F16, F16, I32, NDHWC, NDHWC>>;
|
||||
#elif defined(CK_ENABLE_BF16)
|
||||
using KernelTypes = ::testing::Types<std::tuple<BF16, BF16, I32, NDHWC, NDHWC>>;
|
||||
#elif defined(CK_ENABLE_FP32)
|
||||
using KernelTypes = ::testing::Types<std::tuple<F32, F32, I32, NDHWC, NDHWC>>;
|
||||
#endif
|
||||
|
||||
TYPED_TEST_SUITE(TestMaxPool3dBwd, KernelTypes);

// Runs the max-pool3d backward fixture over three pooling configurations for every type
// tuple in KernelTypes.
TYPED_TEST(TestMaxPool3dBwd, Test_Pool)
{
    // Field order of each entry:
    // length, window_length, window_stride, window_dilation, left_pad, right_pad
    const std::vector<PoolingParam> pool_cases = {
        // every length entry is 1; 1x1x1 window, unit stride and dilation, no padding
        {{1, 1, 1, 1, 1}, {1, 1, 1}, {1, 1, 1}, {1, 1, 1}, {0, 0, 0}, {0, 0, 0}},
        // 4x4x4 window, stride 4, dilation 2, no padding
        {{2, 16, 64, 64, 64}, {4, 4, 4}, {4, 4, 4}, {2, 2, 2}, {0, 0, 0}, {0, 0, 0}},
        // 2x2x2 window, stride 2, unit dilation, padding of 1 on both sides
        {{2, 32, 30, 30, 30}, {2, 2, 2}, {2, 2, 2}, {1, 1, 1}, {1, 1, 1}, {1, 1, 1}},
    };

    this->params = pool_cases;
    this->Run();
}
|
||||
@@ -4,10 +4,12 @@
|
||||
#include "gtest/gtest.h"
|
||||
#include "ck/ck.hpp"
|
||||
|
||||
using F16 = ck::half_t;
|
||||
using F32 = float;
|
||||
using I32 = int32_t;
|
||||
using F16 = ck::half_t;
|
||||
using BF16 = ck::bhalf_t;
|
||||
using F32 = float;
|
||||
using I32 = int32_t;
|
||||
using ck::index_t;
|
||||
using NDHWC = ck::tensor_layout::convolution::NDHWC;
|
||||
|
||||
struct PoolingParam
|
||||
{
|
||||
@@ -1,10 +0,0 @@
|
||||
add_custom_target(test_pool_fwd)
|
||||
|
||||
add_gtest_executable(test_avg_pool3d_fwd test_avg_pool3d_fwd.cpp)
|
||||
add_gtest_executable(test_max_pool3d_fwd test_max_pool3d_fwd.cpp)
|
||||
|
||||
target_link_libraries(test_avg_pool3d_fwd PRIVATE utility device_pool3d_fwd_instance)
|
||||
target_link_libraries(test_max_pool3d_fwd PRIVATE utility device_pool3d_fwd_instance)
|
||||
|
||||
add_dependencies(test_pool_fwd test_avg_pool3d_fwd)
|
||||
add_dependencies(test_pool_fwd test_max_pool3d_fwd)
|
||||
Reference in New Issue
Block a user