mirror of
https://github.com/ROCm/composable_kernel.git
synced 2026-05-04 05:31:24 +00:00
Hip tensor permute (#1002)
* adding files for F32 example
* adding functioning implementation with scalar multiplication and unary operator support
* added fp16 type check in unary square
* updating scalar multiplication as an operator
* functioning version with scalar operator
* changing strides for column major
* updated column major implementation
* working column major implementation
* cleaned up comments, rearranged/renamed files
This commit is contained in:
@@ -355,8 +355,8 @@ struct UnarySquare
|
||||
template <typename T>
|
||||
__host__ __device__ void operator()(T& y, const T& x) const
|
||||
{
|
||||
static_assert(is_same_v<T, float> || is_same_v<T, double> || is_same_v<T, int32_t> ||
|
||||
is_same_v<T, int8_t>
|
||||
static_assert(is_same_v<T, float> || is_same_v<T, half_t> || is_same_v<T, double> ||
|
||||
is_same_v<T, int32_t> || is_same_v<T, int8_t>
|
||||
#ifdef CK_EXPERIMENTAL_BIT_INT_EXTENSION_INT4
|
||||
|| is_same_v<T, int4_t>
|
||||
#endif
|
||||
|
||||
Reference in New Issue
Block a user