mirror of
https://github.com/ROCm/composable_kernel.git
synced 2026-05-14 18:17:44 +00:00
114 lines
2.3 KiB
C++
114 lines
2.3 KiB
C++
#pragma once
|
|
|
|
__device__ index_t get_thread_local_1d_id() { return threadIdx.x; }
|
|
|
|
__device__ index_t get_block_1d_id() { return blockIdx.x; }
|
|
|
|
template <class T1, class T2>
|
|
struct is_same
|
|
{
|
|
static constexpr bool value = false;
|
|
};
|
|
|
|
template <class T>
|
|
struct is_same<T, T>
|
|
{
|
|
static constexpr bool value = true;
|
|
};
|
|
|
|
template <class X, class Y>
|
|
__host__ __device__ constexpr bool is_same_type(X, Y)
|
|
{
|
|
return is_same<X, Y>::value;
|
|
}
|
|
|
|
namespace mod_conv { // namespace mod_conv
|
|
template <class T, T s>
|
|
struct scales
|
|
{
|
|
__host__ __device__ constexpr T operator()(T a) const { return s * a; }
|
|
};
|
|
|
|
template <class T>
|
|
struct plus
|
|
{
|
|
__host__ __device__ constexpr T operator()(T a, T b) const { return a + b; }
|
|
};
|
|
|
|
template <class T>
|
|
struct minus
|
|
{
|
|
__host__ __device__ constexpr T operator()(T a, T b) const { return a - b; }
|
|
};
|
|
|
|
template <class T>
|
|
struct multiplies
|
|
{
|
|
__host__ __device__ constexpr T operator()(T a, T b) const { return a * b; }
|
|
};
|
|
|
|
template <class T>
|
|
struct integer_divide_ceiler
|
|
{
|
|
__host__ __device__ constexpr T operator()(T a, T b) const
|
|
{
|
|
static_assert(is_same<T, index_t>::value || is_same<T, int>::value, "wrong type");
|
|
|
|
return (a + b - 1) / b;
|
|
}
|
|
};
|
|
|
|
template <class T>
|
|
__host__ __device__ constexpr T integer_divide_ceil(T a, T b)
|
|
{
|
|
static_assert(is_same<T, index_t>::value || is_same<T, int>::value, "wrong type");
|
|
|
|
return (a + b - 1) / b;
|
|
}
|
|
|
|
template <class T>
|
|
__host__ __device__ constexpr T max(T x, T y)
|
|
{
|
|
return x > y ? x : y;
|
|
}
|
|
|
|
template <class T, class... Ts>
|
|
__host__ __device__ constexpr T max(T x, Ts... xs)
|
|
{
|
|
static_assert(sizeof...(xs) > 0, "not enough argument");
|
|
|
|
auto y = max(xs...);
|
|
|
|
static_assert(is_same<decltype(y), T>::value, "not the same type");
|
|
|
|
return x > y ? x : y;
|
|
}
|
|
|
|
template <class T>
|
|
__host__ __device__ constexpr T min(T x, T y)
|
|
{
|
|
return x < y ? x : y;
|
|
}
|
|
|
|
template <class T, class... Ts>
|
|
__host__ __device__ constexpr T min(T x, Ts... xs)
|
|
{
|
|
static_assert(sizeof...(xs) > 0, "not enough argument");
|
|
|
|
auto y = min(xs...);
|
|
|
|
static_assert(is_same<decltype(y), T>::value, "not the same type");
|
|
|
|
return x < y ? x : y;
|
|
}
|
|
|
|
// this is wrong
|
|
// TODO: implement correct least common multiple, instead of calling max()
|
|
template <class T, class... Ts>
|
|
__host__ __device__ constexpr T lcm(T x, Ts... xs)
|
|
{
|
|
return max(x, xs...);
|
|
}
|
|
|
|
} // namespace mod_conv
|