Merge commit 'c6bfd97c2d186fd03866c3f5d460bb680ce667a1' into develop

This commit is contained in:
assistant-librarian[bot]
2025-09-27 03:19:57 +00:00
parent 088b4670ae
commit 477a605961
5 changed files with 107 additions and 99 deletions

View File

@@ -1,5 +1,5 @@
// SPDX-License-Identifier: MIT
// Copyright (c) 2018-2024, Advanced Micro Devices, Inc. All rights reserved.
// Copyright (c) 2018-2025, Advanced Micro Devices, Inc. All rights reserved.
#pragma once
@@ -223,6 +223,8 @@ struct BlockFmhaFwdSplitKVCombinePipeline
});
}
// sync before rewriting lse_acc_lds
block_sync_lds();
// store the lse scales in shared memory.
{
constexpr auto spans = decltype(lse_accum)::get_distributed_spans();