Some improvements to trsm parallelism

This commit is contained in:
Tyler Smith
2014-08-20 14:43:17 -05:00
parent daca500db5
commit 699a8151ca
2 changed files with 6 additions and 6 deletions

View File

@@ -83,9 +83,9 @@ void bli_trsm_blk_var2b( obj_t* a,
// Query dimension in partitioning direction.
n_trans = bli_obj_width_after_trans( *b );
dim_t start, end;
-bli_get_range_weighted( thread, 0, n_trans,
-bli_determine_reg_blocksize( b, cntl_blocksize( cntl ) ),
-bli_obj_is_upper( *c ), &start, &end );
+bli_get_range( thread, 0, n_trans,
+bli_determine_reg_blocksize( b, cntl_blocksize( cntl ) ),
+&start, &end );
// Partition along the n dimension.
for ( i = start; i < end; i += b_alg )

View File

@@ -83,9 +83,9 @@ void bli_trsm_blk_var2f( obj_t* a,
// Query dimension in partitioning direction.
n_trans = bli_obj_width_after_trans( *b );
dim_t start, end;
-bli_get_range_weighted( thread, 0, n_trans,
-bli_determine_reg_blocksize( b, cntl_blocksize( cntl ) ),
-bli_obj_is_lower( *c ), &start, &end );
+bli_get_range( thread, 0, n_trans,
+bli_determine_reg_blocksize( b, cntl_blocksize( cntl ) ),
+&start, &end );
// Partition along the n dimension.
for ( i = start; i < end; i += b_alg )