Added the BLIS_ENABLE_ZEN_BLOCK_SIZES macro back to the zen configuration, matching release 1.3. The macro was originally added to improve multithreaded DGEMM scalability on Naples when the number of threads is greater than 16. It was deleted by mistake during the many changes made for the 2.0 release, so this commit restores it. Also includes code cleanup in bli_gemm_front.c.

Change-Id: I6827b58d2dab1041fe182fef5a007b679ac4bb1f
This commit is contained in:
Kiran Varaganti
2019-05-31 15:14:22 +05:30
committed by Kiran Devrajegowda
parent c4368c66ed
commit ea25ba255a
3 changed files with 3 additions and 8 deletions

View File

@@ -136,6 +136,7 @@ void bli_cntx_init_zen( cntx_t* cntx )
*/
// Zen optimized level 3 cache block sizes
#ifdef BLIS_ENABLE_ZEN_BLOCK_SIZES
#if BLIS_ENABLE_SINGLE_INSTANCE_BLOCK_SIZES
@@ -155,7 +156,7 @@ void bli_cntx_init_zen( cntx_t* cntx )
bli_blksz_init_easy( &blkszs[ BLIS_NC ], 4080, 4080, 4080, 4080 );
#endif
bli_blksz_init_easy( &blkszs[ BLIS_NC ], 4080, 2040, 4080, 4080 );
//bli_blksz_init_easy( &blkszs[ BLIS_NC ], 4080, 2040, 4080, 4080 );
bli_blksz_init_easy( &blkszs[ BLIS_AF ], 8, 8, -1, -1 );
bli_blksz_init_easy( &blkszs[ BLIS_DF ], 8, 8, -1, -1 );

View File

@@ -42,7 +42,7 @@
#define BLIS_DEFAULT_MR_THREAD_MAX 1
#define BLIS_DEFAULT_NR_THREAD_MAX 1
#define BLIS_ENABLE_ZEN_BLOCK_SIZES
#define BLIS_ENABLE_SMALL_MATRIX
#define BLIS_ENABLE_SMALL_MATRIX_TRSM

View File

@@ -52,13 +52,7 @@ void bli_gemm_front
obj_t a_local;
obj_t b_local;
obj_t c_local;
#if 0
gint_t M = bli_obj_length( c );
gint_t N = bli_obj_width( c );
gint_t K = bli_obj_width( a );
if( !(M && N && K)) return;
#endif
#ifdef BLIS_ENABLE_SMALL_MATRIX