From 9b0d87fe9ac1f5700f1cecaa7046ab2c4f23d21a Mon Sep 17 00:00:00 2001 From: Qianfeng Date: Thu, 13 Jun 2024 16:12:20 +0800 Subject: [PATCH] Fix to the using of static_for in amd_buffer_addressing.hpp (#1337) * Add insert_dummy_dep_per_dword over-loading for length 64 * Fix insert_dummy_dep_per_dword and remove over-loading for length 64 * Remove blank lines --------- Co-authored-by: Po Yen Chen [ROCm/composable_kernel commit: 37a347e3807198400d6ee1c8401f7c2cbb1d426e] --- include/ck_tile/core/arch/amd_buffer_addressing.hpp | 5 +++-- 1 file changed, 3 insertions(+), 2 deletions(-) diff --git a/include/ck_tile/core/arch/amd_buffer_addressing.hpp b/include/ck_tile/core/arch/amd_buffer_addressing.hpp index 9c6e85f013..13e92ef0bb 100644 --- a/include/ck_tile/core/arch/amd_buffer_addressing.hpp +++ b/include/ck_tile/core/arch/amd_buffer_addressing.hpp @@ -552,8 +552,9 @@ namespace impl{ template CK_TILE_DEVICE void insert_dummy_dep_per_dword(array& b) { - static_for<0, b.size(), 1>{}([&](auto i){ - asm volatile(" " : : "v"(b.get(i)) : "memory"); + constexpr auto kSize = remove_cvref_t::size(); + static_for<0, kSize, 1>{}([&](auto i){ + asm volatile(" " : : "v"(b.get(number{})) : "memory"); }); } #if 1