From 34c7c3bbf287e22877016b0b39b0121ae110f044 Mon Sep 17 00:00:00 2001 From: KateJu <153474223+kateju12@users.noreply.github.com> Date: Thu, 23 Apr 2026 14:06:27 +0000 Subject: [PATCH] [rocm-libraries] ROCm/rocm-libraries#6655 (commit 677b38d) Add missing lds sync ## Motivation ## Technical Details ## Test Plan ## Test Result ## Submission Checklist - [ ] Look over the contributing guidelines at https://github.com/ROCm/ROCm/blob/develop/CONTRIBUTING.md#pull-requests. --- .../device/impl/device_grouped_gemm_multi_abd_wmma_fixed_nk.hpp | 1 + .../device/impl/device_grouped_gemm_multi_abd_xdl_fixed_nk.hpp | 1 + 2 files changed, 2 insertions(+) diff --git a/include/ck/tensor_operation/gpu/device/impl/device_grouped_gemm_multi_abd_wmma_fixed_nk.hpp b/include/ck/tensor_operation/gpu/device/impl/device_grouped_gemm_multi_abd_wmma_fixed_nk.hpp index 9532f7e76a..87be350a44 100644 --- a/include/ck/tensor_operation/gpu/device/impl/device_grouped_gemm_multi_abd_wmma_fixed_nk.hpp +++ b/include/ck/tensor_operation/gpu/device/impl/device_grouped_gemm_multi_abd_wmma_fixed_nk.hpp @@ -162,6 +162,7 @@ __launch_bounds__(CK_MAX_THREAD_PER_BLOCK, MinimumOccupancy) id_off += grid_size_grp; id_local += grid_size_grp; + block_sync_lds(); } } #else diff --git a/include/ck/tensor_operation/gpu/device/impl/device_grouped_gemm_multi_abd_xdl_fixed_nk.hpp b/include/ck/tensor_operation/gpu/device/impl/device_grouped_gemm_multi_abd_xdl_fixed_nk.hpp index 9978b62b17..fa33e0fdea 100644 --- a/include/ck/tensor_operation/gpu/device/impl/device_grouped_gemm_multi_abd_xdl_fixed_nk.hpp +++ b/include/ck/tensor_operation/gpu/device/impl/device_grouped_gemm_multi_abd_xdl_fixed_nk.hpp @@ -136,6 +136,7 @@ __launch_bounds__(GridwiseGemm::MaxBlockSize, CK_MIN_BLOCK_PER_CU) id_off += grid_size_grp; id_local += grid_size_grp; + block_sync_lds(); } } #else