Use two work-groups per compute-unit for scheduling the kernel

This commit is contained in:
Qianfeng Zhang
2025-06-26 09:46:33 +00:00
parent dc7e62a658
commit 60d8ffb6cf

View File

@@ -91,7 +91,7 @@ struct HstuAttentionFwdPipelineQRKSVS
if constexpr(kHasBias)
return 2;
else
-return 3;
+return 2;
}
else if constexpr(kQKHeaddim == 256)
{