From d5e758047311febc3e9e5495c1fdf405e9f4b40c Mon Sep 17 00:00:00 2001 From: "Lin, Qun" Date: Sun, 25 May 2025 02:13:15 -0500 Subject: [PATCH] correct a typo in tail --- ...wise_gemm_pipeline_xdlops_v3_mx_bpreshuffle.hpp | 14 +++++++------- 1 file changed, 7 insertions(+), 7 deletions(-) diff --git a/include/ck/tensor_operation/gpu/block/blockwise_gemm_pipeline_xdlops_v3_mx_bpreshuffle.hpp b/include/ck/tensor_operation/gpu/block/blockwise_gemm_pipeline_xdlops_v3_mx_bpreshuffle.hpp index 357b91373b..40ce308f22 100644 --- a/include/ck/tensor_operation/gpu/block/blockwise_gemm_pipeline_xdlops_v3_mx_bpreshuffle.hpp +++ b/include/ck/tensor_operation/gpu/block/blockwise_gemm_pipeline_xdlops_v3_mx_bpreshuffle.hpp @@ -450,7 +450,7 @@ struct BlockwiseGemmXdlops_pipeline_v3_mx_bprehuffle LocalPrefetchStages ? MRepeat/ MXdlPack - LocalPrefetchStages : 0; // main body if constexpr(HasMainLoop) { @@ -516,7 +516,7 @@ struct BlockwiseGemmXdlops_pipeline_v3_mx_bprehuffle{}([&](auto m0) { - if constexpr(m0.value == (MRepeat/ MXdlPack - LocalPrefetchStages)) + if constexpr(m0.value == SwitchM) { block_sync_lds(); a_blockwise_copy.Run(a_grid_desc, a_grid_buf, a_block_desc, a_block_bufs(scale_comp_buf)); @@ -524,7 +524,7 @@ struct BlockwiseGemmXdlops_pipeline_v3_mx_bprehuffle= (MRepeat/ MXdlPack - LocalPrefetchStages) + m0.value >= SwitchM ? scale_mem_buf : scale_comp_buf; @@ -778,14 +778,14 @@ struct BlockwiseGemmXdlops_pipeline_v3_mx_bprehuffle= (MRepeat - LocalPrefetchStages * MXdlPack) / MXdlPack ? I1 : I0; + m0.value >= SwitchM ? I1 : I0; static_for<0, KRepeat, 1>{}([&](auto k) { static_for<0, MXdlPack, 1>{}([&](auto imxdl) { @@ -893,7 +893,7 @@ struct BlockwiseGemmXdlops_pipeline_v3_mx_bprehuffle{}([&](auto k) { static_for<0, MXdlPack, 1>{}([&](auto imxdl) { @@ -1058,7 +1058,7 @@ struct BlockwiseGemmXdlops_pipeline_v3_mx_bprehuffle{}([&](auto k) { static_for<0, MXdlPack, 1>{}([&](auto imxdl) {