Re-tuned GEMV thresholds (#210)

Retune the DGEMV AVX512 non-transpose thresholds to avoid a regression on ZEN4.

AMD-Internal: [CPUPL-7448]
This commit is contained in:
Sharma, Shubham
2025-09-19 12:43:50 +05:30
committed by GitHub
parent a9df3fd8d5
commit 773d3a3d45

View File

@@ -1471,7 +1471,7 @@ void bli_dgemv_n_zen4_int (
if ( size < 95000 )
{
// we call sequential GEMV
if ( m <= 180 )
if ( m <= 180 && n >= 8 )
{
ker_ft = bli_dgemv_n_zen4_int_40x2_st;
}
@@ -1494,7 +1494,7 @@ void bli_dgemv_n_zen4_int (
ker_ft = bli_dgemv_m_zen4_int_40x8_mt_Mdiv;
}
#else
if ( m <= 180 )
if ( m <= 180 && n >= 8 )
{
ker_ft = bli_dgemv_n_zen4_int_40x2_st;
}