updated bfloat16_to_float

[ROCm/composable_kernel commit: 89e1ebd4d5]
2026-05-16 10:59:55 +00:00 · 2021-11-16 18:01:25 +00:00
parent 456f5306df
commit ea6fa92eea
8 changed files with 93 additions and 165 deletions
--- a/host/host_tensor/include/host_tensor.hpp
+++ b/host/host_tensor/include/host_tensor.hpp
@@ -321,18 +321,14 @@ void check_error(const Tensor<T>& ref, const Tensor<T>& result)
    std::cout << "max_diff: " << max_diff << ", " << ref_value << ", " << result_value << std::endl;
 }

-float bf16_to_f32(ushort src_val)
+__host__ __device__ float bf16_to_f32(ushort src_val)
 {
-    typedef union
+    union
    {
-        ushort x, y;
-        float f32;
-    } bf16_f32_t;
-
-    bf16_f32_t v;
-    v.x = 0;
-    v.y = src_val;
-    return v.f32;
+        uint32_t int32;
+        float fp32;
+    } u = {uint32_t(src_val) << 16};
+    return u.fp32;
 }

 template <>
@@ -354,8 +350,7 @@ void check_error<ushort>(const Tensor<ushort>& ref, const Tensor<ushort>& result
    }

    std::cout << "error: " << error << std::endl;
-    std::cout << "max_diff: " << max_diff << ", ref: " << ref_value << ", res: " << result_value
-              << std::endl;
+    std::cout << "max_diff: " << max_diff << ", " << ref_value << ", " << result_value << std::endl;
 }

 #endif