From 529dfe7c93426d33d9ce6b0cedb55ff38e095cc5 Mon Sep 17 00:00:00 2001 From: rtmadduri Date: Mon, 2 Dec 2024 00:13:56 -0800 Subject: [PATCH] LWPCK-2429: Device grouped GEMM uses Async Memcpy (#1695) * LWPCK-2429: Device grouped GEMM uses Async Memcpy Resolving merge conflicts * reverting changes to profile_grouped_gemm * revert date change --------- Co-authored-by: Illia Silin <98187287+illsilin@users.noreply.github.com> [ROCm/composable_kernel commit: 9488f1c981cda8515b45952a14e539621150c1f6] --- .../impl/device_grouped_gemm_multiple_d_dl.hpp | 12 ++++++------ ...gemm_multiple_d_splitk_xdl_cshuffle_two_stage.hpp | 10 +++++----- ...rouped_gemm_multiple_d_xdl_cshuffle_tile_loop.hpp | 8 ++++---- .../gpu/device/impl/device_grouped_gemm_xdl.hpp | 12 ++++++------ .../impl/device_grouped_gemm_xdl_splitk_cshuffle.hpp | 10 +++++----- 5 files changed, 26 insertions(+), 26 deletions(-) diff --git a/include/ck/tensor_operation/gpu/device/impl/device_grouped_gemm_multiple_d_dl.hpp b/include/ck/tensor_operation/gpu/device/impl/device_grouped_gemm_multiple_d_dl.hpp index 060a16d1e2..959fc890b8 100644 --- a/include/ck/tensor_operation/gpu/device/impl/device_grouped_gemm_multiple_d_dl.hpp +++ b/include/ck/tensor_operation/gpu/device/impl/device_grouped_gemm_multiple_d_dl.hpp @@ -1,6 +1,6 @@ #pragma once // SPDX-License-Identifier: MIT -// Copyright (c) 2018-2023, Advanced Micro Devices, Inc. All rights reserved. +// Copyright (c) 2018-2024, Advanced Micro Devices, Inc. All rights reserved. #pragma once @@ -603,11 +603,11 @@ struct DeviceGroupedGemmMultipleD_Dl : public DeviceGroupedGemm