mirror of
https://github.com/amd/blis.git
synced 2026-04-19 23:28:52 +00:00
Re-tuned GEMV thresholds (#210)
Retune DGEMV AVX512 non-transpose thresholds to avoid a regression on ZEN4. AMD-Internal: [CPUPL-7448]
This commit is contained in:
@@ -1471,7 +1471,7 @@ void bli_dgemv_n_zen4_int (
|
||||
if ( size < 95000 )
|
||||
{
|
||||
// we call sequential GEMV
|
||||
if ( m <= 180 )
|
||||
if ( m <= 180 && n >= 8 )
|
||||
{
|
||||
ker_ft = bli_dgemv_n_zen4_int_40x2_st;
|
||||
}
|
||||
@@ -1494,7 +1494,7 @@ void bli_dgemv_n_zen4_int (
|
||||
ker_ft = bli_dgemv_m_zen4_int_40x8_mt_Mdiv;
|
||||
}
|
||||
#else
|
||||
if ( m <= 180 )
|
||||
if ( m <= 180 && n >= 8 )
|
||||
{
|
||||
ker_ft = bli_dgemv_n_zen4_int_40x2_st;
|
||||
}
|
||||
|
||||
Reference in New Issue
Block a user