From 2a35a5e725db62b9e7f5ba4e210b27d32770f24d Mon Sep 17 00:00:00 2001
From: zjing14
Date: Tue, 2 May 2023 10:30:23 -0500
Subject: [PATCH] fixed init range (#691)

[ROCm/composable_kernel commit: f53ede26e5cb58cb90d9c6c96dafc9a61d1dccc8]
---
 profiler/include/profiler/profile_gemm_splitk_impl.hpp | 6 +++---
 1 file changed, 3 insertions(+), 3 deletions(-)

diff --git a/profiler/include/profiler/profile_gemm_splitk_impl.hpp b/profiler/include/profiler/profile_gemm_splitk_impl.hpp
index 233fb15c0a..4cc62509d7 100644
--- a/profiler/include/profiler/profile_gemm_splitk_impl.hpp
+++ b/profiler/include/profiler/profile_gemm_splitk_impl.hpp
@@ -72,8 +72,8 @@ bool profile_gemm_splitk_impl(int do_verification,
     {
     case 0: break;
     case 1:
-        a_m_k.GenerateTensorValue(GeneratorTensor_2{0, 1});
-        b_k_n.GenerateTensorValue(GeneratorTensor_2{-1, 1});
+        a_m_k.GenerateTensorValue(GeneratorTensor_2{-1, 2});
+        b_k_n.GenerateTensorValue(GeneratorTensor_2{-1, 2});
         break;
     default:
         a_m_k.GenerateTensorValue(GeneratorTensor_3{0.0, 1.0});
@@ -94,7 +94,7 @@ bool profile_gemm_splitk_impl(int do_verification,
     a_device_buf.ToDevice(a_m_k.mData.data());
     b_device_buf.ToDevice(b_k_n.mData.data());
-    c_device_buf.ToDevice(c_m_n_device_result.mData.data());
+    c_device_buf.SetZero();
     using DeviceOp = ck::tensor_operation::device::DeviceGemmSplitK