Merge commit '5d67d82a0bb6dbf5f82f3b4ba2e9188eb838b927' into develop

This commit is contained in:
assistant-librarian[bot]
2025-12-02 11:12:35 +00:00
parent ae8f3a3b19
commit be7c12a132
2 changed files with 506 additions and 410 deletions

View File

@@ -23,7 +23,8 @@ struct BaseGemmPipelineAgBgCrCompV4
/// @brief Reports whether a block running `num_loop` iterations enters the hot loop.
///
/// @param num_loop Loop count for the block.
/// @return true when `num_loop >= HotLoopGlobalReads + PrefetchStages`, false otherwise.
///
/// A stale `return num_loop > PrefetchStages;` used to precede this logic and
/// made the threshold below unreachable; only the newer predicate is kept.
CK_TILE_HOST_DEVICE static constexpr bool BlockHasHotloop(index_t num_loop)
{
    // NOTE(review): presumably the number of global reads issued per hot-loop
    // pass; the value 2 is not justified by the visible code - confirm against
    // the pipeline body.
    constexpr index_t HotLoopGlobalReads = 2;

    // The hot loop is only worthwhile once the loop count covers the prefetch
    // stages plus one full set of hot-loop reads.
    return num_loop >= (HotLoopGlobalReads + PrefetchStages);
}
CK_TILE_HOST_DEVICE static constexpr TailNumber GetBlockLoopTailNum(index_t num_loop)