fix profiler_grouped_gemm (#1766)

[ROCm/composable_kernel commit: 2944c50894]
This commit is contained in:
Illia Silin
2024-12-19 17:24:05 -08:00
committed by GitHub
parent f501304e4b
commit a4bb0d50ec

View File

@@ -77,7 +77,7 @@ bool profile_grouped_gemm_impl(int do_verification,
std::vector<Tensor<CDataType>> c_m_n_host_results;
std::vector<Tensor<CDataType>> c_m_n_device_results;
-ComputeDataType max_abs_in_val = 0.f;
+double max_abs_in_val = 0.f;
for(std::size_t i = 0; i < group_count; i++)
{
a_m_k.push_back(