mirror of
https://github.com/ROCm/composable_kernel.git
synced 2026-05-14 02:02:46 +00:00
[CK_TILE] Fix for comp pipeline v4 (#3307)
* Fix for gemm_pipeline_ag_bg_cr_comp_v4
* Update hotloop condition
Co-authored-by: Bartłomiej Kocot <barkocot@amd.com>
* fix formatting
---------
Co-authored-by: Bartłomiej Kocot <barkocot@amd.com>
[ROCm/composable_kernel commit: 5d67d82a0b]
This commit is contained in:
@@ -23,7 +23,8 @@ struct BaseGemmPipelineAgBgCrCompV4
|
||||
|
||||
CK_TILE_HOST_DEVICE static constexpr bool BlockHasHotloop(index_t num_loop)
|
||||
{
|
||||
- return num_loop > PrefetchStages;
|
||||
+ constexpr index_t HotLoopGlobalReads = 2;
|
||||
+ return num_loop >= (HotLoopGlobalReads + PrefetchStages);
|
||||
}
|
||||
|
||||
CK_TILE_HOST_DEVICE static constexpr TailNumber GetBlockLoopTailNum(index_t num_loop)
|
||||
|
||||
Reference in New Issue
Block a user