mirror of
https://github.com/ROCm/composable_kernel.git
synced 2026-05-02 20:51:23 +00:00
Fixed f8_gemm NaN (#975)
* workaround NaN problem by changing output to fp16
* enable f8/bf8 gemm tests on MI200
* workaround f16 to f8 conversion

---------

Co-authored-by: Jing Zhang <jizha@amd.com>
This commit is contained in:
@@ -173,8 +173,7 @@ struct PassThrough
|
||||
template <>
|
||||
__host__ __device__ void operator()<bf8_t, half_t>(bf8_t& y, const half_t& x) const
|
||||
{
|
||||
// to-do: fix half_t to bf8_t convert
|
||||
y = ck::type_convert<bf8_t>(ck::type_convert<float>(x));
|
||||
y = ck::type_convert<bf8_t>(x);
|
||||
}
|
||||
#endif
|
||||
};
|
||||
|
||||
Reference in New Issue
Block a user