mirror of
https://github.com/ROCm/composable_kernel.git
synced 2026-04-19 22:39:03 +00:00
Slightly increase tolerance for batchnorm profiler
This commit is contained in:
@@ -430,7 +430,17 @@ bool profile_grouped_conv_fwd_bias_clamp_impl(int do_verification,
     {
         out_device_buf.FromDevice(device_output.mData.data());
 
-        pass = pass & ck::utils::check_err(device_output, host_output);
+        if constexpr(std::is_same_v<OutDataType, ck::half_t>)
+        {
+            // The batchnorm involves operations which can cause small numerical
+            // differences between host and device implementations
+            static double rtol = 1e-2;
+            pass = pass & ck::utils::check_err(device_output, host_output, rtol);
+        }
+        else
+        {
+            pass = pass & ck::utils::check_err(device_output, host_output);
+        }
 
         if(do_log)
         {
Reference in New Issue
Block a user