From 3fa44df1c283625da7e919a000ccbfd4d0091b1e Mon Sep 17 00:00:00 2001 From: ozturkosu Date: Fri, 13 Jun 2025 05:49:43 -0400 Subject: [PATCH] update in profiler --- .../profile_gemm_universal_streamk_impl.hpp | 15 +++++++++++++-- 1 file changed, 13 insertions(+), 2 deletions(-) diff --git a/profiler/include/profiler/profile_gemm_universal_streamk_impl.hpp b/profiler/include/profiler/profile_gemm_universal_streamk_impl.hpp index bea3492233..c0d486a63a 100755 --- a/profiler/include/profiler/profile_gemm_universal_streamk_impl.hpp +++ b/profiler/include/profiler/profile_gemm_universal_streamk_impl.hpp @@ -250,8 +250,19 @@ bool profile_gemm_universal_streamk_impl(int do_verification, float gb_per_sec = num_btype / 1.E6 / ave_time; - const auto actual_launch_grid_dims = argument_ptr->GetLaunchGridDims(); - + // const auto actual_launch_grid_dims = argument_ptr->GetLaunchGridDims(); + const auto* typed_argument_ptr = dynamic_cast::Argument*>(argument_ptr); + if (typed_argument_ptr) + { + const auto actual_launch_grid_dims = typed_argument_ptr->GetLaunchGridDims(); + std::cout << "Actual Grid Dimensions: " << actual_launch_grid_dims.x << "x" + << actual_launch_grid_dims.y << "x" << actual_launch_grid_dims.z << std::endl; + } + else + { + std::cerr << "Error: Failed to cast argument_ptr to the correct type." << std::endl; + } + std::cout << "Perf: " << std::setw(10) << ave_time << " ms, " << tflops << " TFlops, " << gb_per_sec << " GB/s, " << op_name << ", Grid_size " << actual_launch_grid_dims.x // Use the x-dimension of the actual launch grid