mirror of
https://github.com/amd/blis.git
synced 2026-05-11 17:50:00 +00:00
Fix in DTRSM Small MT
Details: 1. Changes are made in the dtrsm small MT path to avoid accuracy issues. AMD-Internal: [SWLCSG-1470] Change-Id: I65237225892f97b7222fe71f66b02841b5956560
This commit is contained in:
committed by
Satish Kumar Nuggu
parent
2cdeea3c66
commit
b7bc5f204f
@@ -967,40 +967,6 @@ void dtrsm_blis_impl
|
||||
return;
|
||||
}
|
||||
}
|
||||
|
||||
// bli_trsm_small_mt is performing better than native multithread
|
||||
// for certain sizes of m & n.
|
||||
#ifdef BLIS_ENABLE_OPENMP
|
||||
rntm_t rntm;
|
||||
bli_rntm_init_from_global( &rntm );
|
||||
|
||||
// Query the total number of threads from the rntm_t object.
|
||||
dim_t n_threads = bli_rntm_num_threads( &rntm );
|
||||
if ( ( (n_threads > 1) && (m0 <= 1500) && (n0 <= 1500) ) ||
|
||||
( (n_threads == 32) && (m0 <= 2300) && (n0 <= 2300) ) ||
|
||||
( (n_threads == 16) && (m0 <= 3800) && (n0 <= 3800) ) ||
|
||||
( (n_threads == 8) && (m0 <= 2800) && (n0 <= 2800) ) ||
|
||||
( (n_threads == 4) && (m0 <= 2000) && (n0 <= 2000) ) ||
|
||||
( (n_threads == 2) && (m0 <= 2000) && (n0 <= 2000) ) )
|
||||
{
|
||||
err_t status;
|
||||
status = bli_trsm_small_mt(
|
||||
blis_side,
|
||||
&alphao,
|
||||
&ao,
|
||||
&bo,
|
||||
NULL,
|
||||
NULL);
|
||||
|
||||
if ( status == BLIS_SUCCESS )
|
||||
{
|
||||
AOCL_DTL_TRACE_EXIT(AOCL_DTL_LEVEL_INFO);
|
||||
/* Finalize BLIS. */
|
||||
bli_finalize_auto();
|
||||
return;
|
||||
}
|
||||
}
|
||||
#endif// BLIS_ENABLE_OPENMP
|
||||
} // bli_cpuid_is_avx_supported
|
||||
#endif// END of BLIS_ENABLE_SMALL_MATRIX_TRSM
|
||||
|
||||
|
||||
Reference in New Issue
Block a user