GEMM Multiply Multiply Fix (#2102)

* Fix the type conversion, increase the BF16 conversion, and fix the profile comment

* Fix the CI

[ROCm/composable_kernel commit: 0cca8fa28f]
This commit is contained in:
Thomas Ning
2025-04-22 01:13:22 -07:00
committed by GitHub
parent 7e42b9a814
commit 79b01b0824
2 changed files with 2 additions and 2 deletions

View File

@@ -117,7 +117,7 @@ inline __host__ __device__ constexpr bhalf_t type_convert<bhalf_t, float>(float
#if CK_USE_RNE_BF16_CONVERSION
return bf16_convert_rtn<bhalf_t>(x);
#else
return uint16_t(uint32_t{x} >> 16);
return uint16_t(static_cast<uint32_t>(x) >> 16);
#endif
}