Tiny movement in the code lines of the pipeline

This commit is contained in:
Qianfeng Zhang
2025-06-26 10:09:51 +00:00
parent 60d8ffb6cf
commit 3c300d3069

View File

@@ -368,7 +368,9 @@ struct HstuAttentionFwdPipelineQRKSVS
move_tile_window(v_dram_window, {0, kK1});
__builtin_amdgcn_sched_barrier(0);
// for i_k1 = k1_loop-1, the loading is for next iteration
k_tile = load_tile(k_dram_window);
move_tile_window(k_dram_window, {kK1, 0});
block_sync_lds();
// execute current unroll of gemm_0
@@ -395,14 +397,6 @@ struct HstuAttentionFwdPipelineQRKSVS
tile_elementwise_inout([&scale_s](auto& x) { x = x * scale_s; }, sacc_tile);
}
__builtin_amdgcn_sched_barrier(0);
// for i_k1 = k1_loop-1, the loading is for next iteration
k_tile = load_tile(k_dram_window);
move_tile_window(k_dram_window, {kK1, 0});
__builtin_amdgcn_sched_barrier(0);
if constexpr(HstuMask::IsMasking)
{
if constexpr(HstuMask::kUseLocal)