mirror of
https://github.com/ROCm/composable_kernel.git
synced 2026-05-16 19:09:59 +00:00
* conv3d compiles but has memory error
* conv3d works
* fix performance issue by using __builtin_amdgc_readfirstlane
* change MakeBlock2CTileMap to MakeDefaultBlock2CTileMap; change c_blockid_to* to cblockid_to*
* clang-format
* remove CK_EXPERIMENTAL_PASS_TENSOR_DECRIPTOR_BY_*; moved wrapper into DeviceConv3d
* format
* remove useless marc
* add comment
Co-authored-by: Chao Liu <chao.liu2@amd.com>
[ROCm/composable_kernel commit: 6dfb92bbef]
51 lines
1.5 KiB
C++
51 lines
1.5 KiB
C++
#ifndef CK_INTEGRAL_CONSTANT_HPP
|
|
#define CK_INTEGRAL_CONSTANT_HPP
|
|
|
|
namespace ck {
|
|
|
|
template <class T, T v>
|
|
struct integral_constant
|
|
{
|
|
static constexpr T value = v;
|
|
typedef T value_type;
|
|
typedef integral_constant type;
|
|
__host__ __device__ constexpr operator value_type() const noexcept { return value; }
|
|
__host__ __device__ constexpr value_type operator()() const noexcept { return value; }
|
|
};
|
|
|
|
template <typename TX, TX X, typename TY, TY Y>
|
|
__host__ __device__ constexpr auto operator+(integral_constant<TX, X>, integral_constant<TY, Y>)
|
|
{
|
|
return integral_constant<decltype(X + Y), X + Y>{};
|
|
}
|
|
|
|
template <typename TX, TX X, typename TY, TY Y>
|
|
__host__ __device__ constexpr auto operator-(integral_constant<TX, X>, integral_constant<TY, Y>)
|
|
{
|
|
static_assert(Y <= X, "wrong!");
|
|
return integral_constant<decltype(X - Y), X - Y>{};
|
|
}
|
|
|
|
template <typename TX, TX X, typename TY, TY Y>
|
|
__host__ __device__ constexpr auto operator*(integral_constant<TX, X>, integral_constant<TY, Y>)
|
|
{
|
|
return integral_constant<decltype(X * Y), X * Y>{};
|
|
}
|
|
|
|
template <typename TX, TX X, typename TY, TY Y>
|
|
__host__ __device__ constexpr auto operator/(integral_constant<TX, X>, integral_constant<TY, Y>)
|
|
{
|
|
static_assert(Y > 0, "wrong!");
|
|
return integral_constant<decltype(X / Y), X / Y>{};
|
|
}
|
|
|
|
template <typename TX, TX X, typename TY, TY Y>
|
|
__host__ __device__ constexpr auto operator%(integral_constant<TX, X>, integral_constant<TY, Y>)
|
|
{
|
|
static_assert(Y > 0, "wrong!");
|
|
return integral_constant<decltype(X % Y), X % Y>{};
|
|
}
|
|
|
|
} // namespace ck
|
|
#endif
|