mirror of
https://github.com/ROCm/composable_kernel.git
synced 2026-05-24 23:05:54 +00:00
* Turning compare warnings on * Cleaning part I * Cleaning part II * Explicit static_cast to ck::type_convert * Resolving large tensor size issue. * format * revert change to tensor descriptor; promote ElementSpaceSize to 64bit * use integer value for GEMM test * Review remarks * Review remarks + issues with (un)signed arithmetic * Format fix * Format * Clang-format. * fix 2gb limit issue Co-authored-by: Chao Liu <chao.liu2@amd.com> Co-authored-by: Adam Osewski <aosewski@amd.com>
20 lines
389 B
C++
20 lines
389 B
C++
#ifndef REDUCE_UTILS_HPP
|
|
#define REDUCE_UTILS_HPP
|
|
|
|
#include <cstddef>
#include <stdexcept>

#include "data_type.hpp"
|
|
|
|
namespace ck {
|
|
namespace reduce_util {
|
|
|
|
template <typename T>
|
|
void to_f32_vector(const Tensor<T>& src, Tensor<float>& dst)
|
|
{
|
|
for(std::size_t i = 0; i < src.mData.size(); ++i)
|
|
dst.mData[i] = type_convert<float>(src.mData[i]);
|
|
}
|
|
|
|
} // namespace reduce_util
|
|
|
|
} // namespace ck
|
|
#endif
|