diff --git a/frame/base/bli_rntm.c b/frame/base/bli_rntm.c index 2c7d6019c..d5d86e9fb 100644 --- a/frame/base/bli_rntm.c +++ b/frame/base/bli_rntm.c @@ -2120,9 +2120,6 @@ BLIS_INLINE void aocl_dcopyv_dynamic break; case BLIS_ARCH_ZEN4: - case BLIS_ARCH_ZEN: - case BLIS_ARCH_ZEN2: - case BLIS_ARCH_ZEN3: if ( n_elem <= 17000 ) *nt_ideal = 1; @@ -2134,6 +2131,18 @@ BLIS_INLINE void aocl_dcopyv_dynamic *nt_ideal = 8; // dcopy does not scale with more than 8 threads break; + case BLIS_ARCH_ZEN: + case BLIS_ARCH_ZEN2: + case BLIS_ARCH_ZEN3: + + if ( n_elem <= 17000 ) + *nt_ideal = 1; + else if (n_elem <= 52200) + *nt_ideal = 4; + else + *nt_ideal = 8; + // dcopy does not scale with more than 8 threads + break; default: // Without this default condition, compiler will throw