mirror of
https://github.com/ROCm/composable_kernel.git
synced 2026-05-13 17:55:48 +00:00
Update to GetNumPrefetchV() for kM0=64 path
This commit is contained in:
@@ -32,9 +32,18 @@ struct BlockFmhaPipelineQRKSVSWholeKPrefetchDefaultPolicy
|
||||
|
||||
if constexpr(Problem::kUseTrLoad)
|
||||
{
|
||||
if constexpr(n0_loops >= 4 && k1_loops >= 6)
|
||||
return 3;
|
||||
return 2;
|
||||
// kM0 is 64, kN0 is 128, prefetch all k_tiles
|
||||
if constexpr(IsPreloadWholeNextIterationK<Problem>())
|
||||
{
|
||||
if constexpr(n0_loops >= 4 && k1_loops >= 6)
|
||||
return 2;
|
||||
return 2;
|
||||
}
|
||||
else // kM0 is 128, kN0 is 64, prefetch one k_tile
|
||||
{
|
||||
// kN0 == 64, try to prefetch more v_tiles
|
||||
return 2;
|
||||
};
|
||||
}
|
||||
else
|
||||
{
|
||||
|
||||
Reference in New Issue
Block a user