mirror of
https://github.com/amd/blis.git
synced 2026-05-24 18:34:40 +00:00
AOCL Dynamic for zen3 dcopy
- Create separate AOCL Dynamic values for multithreading dcopy API for zen1, zen2 and zen3. AMD-Internal: [CPUPL-5238] Change-Id: I42f56393716edeeace8bfe71d7adab0ba7325b47
This commit is contained in:
@@ -2120,9 +2120,6 @@ BLIS_INLINE void aocl_dcopyv_dynamic
|
||||
break;
|
||||
|
||||
case BLIS_ARCH_ZEN4:
|
||||
case BLIS_ARCH_ZEN:
|
||||
case BLIS_ARCH_ZEN2:
|
||||
case BLIS_ARCH_ZEN3:
|
||||
|
||||
if ( n_elem <= 17000 )
|
||||
*nt_ideal = 1;
|
||||
@@ -2134,6 +2131,18 @@ BLIS_INLINE void aocl_dcopyv_dynamic
|
||||
*nt_ideal = 8;
|
||||
// dcopy does not scale with more than 8 threads
|
||||
break;
|
||||
case BLIS_ARCH_ZEN:
|
||||
case BLIS_ARCH_ZEN2:
|
||||
case BLIS_ARCH_ZEN3:
|
||||
|
||||
if ( n_elem <= 17000 )
|
||||
*nt_ideal = 1;
|
||||
else if (n_elem <= 52200)
|
||||
*nt_ideal = 4;
|
||||
else
|
||||
*nt_ideal = 8;
|
||||
// dcopy does not scale with more than 8 threads
|
||||
break;
|
||||
|
||||
default:
|
||||
// Without this default condition, compiler will throw
|
||||
|
||||
Reference in New Issue
Block a user