Eliminate warning caused by failure to meet occupancy requirement (#2389)

Co-authored-by: felix <felix.li@amd.com>
This commit is contained in:
Po Yen Chen
2025-07-08 09:17:25 +08:00
committed by GitHub
parent f240ae3248
commit b2dea90116

View File

@@ -122,6 +122,9 @@ struct BlockFmhaBatchPrefillPipelineQRKSVSAsync
{
if constexpr(kPadSeqLenK && BiasEnum == BlockAttentionBiasEnum::ELEMENTWISE_BIAS)
return 1;
// using a larger K/V LDS buffer size lowers the occupancy
else if constexpr(64 <= kK0 || 64 <= kK1)
return 1;
else
return 2;
}