mirror of
https://github.com/amd/blis.git
synced 2026-05-11 09:39:59 +00:00
Fixed bug introduced by bugfix in 25b258d.
Details: - We actually need to check the alignment of lda*sizeof(double) and NOT of a+lda, because in the latter case a misalignment in a and a misalignment in the lda offset could cancel each other out, making the sum look aligned and still allowing the optimized code to run when it shouldn't. Thanks to Devin for pointing this out.
This commit is contained in:
@@ -92,7 +92,7 @@ void bli_daxpyf_opt_var1(
|
||||
use_ref = TRUE;
|
||||
}
|
||||
else if ( inca != 1 || incx != 1 || incy != 1 ||
|
||||
bli_is_unaligned_to( a+lda, 16 ) )
|
||||
bli_is_unaligned_to( lda*sizeof(double), 16 ) )
|
||||
{
|
||||
use_ref = TRUE;
|
||||
}
|
||||
|
||||
@@ -116,7 +116,7 @@ void bli_ddotxaxpyf_opt_var1( conj_t conjat,
|
||||
use_ref = TRUE;
|
||||
}
|
||||
else if ( inca != 1 || incw != 1 || incx != 1 || incy != 1 || incz != 1 ||
|
||||
bli_is_unaligned_to( a+lda, 16 ) )
|
||||
bli_is_unaligned_to( lda*sizeof(double), 16 ) )
|
||||
{
|
||||
use_ref = TRUE;
|
||||
}
|
||||
|
||||
@@ -104,7 +104,7 @@ void bli_ddotxf_opt_var1(
|
||||
use_ref = TRUE;
|
||||
}
|
||||
else if ( inca != 1 || incx != 1 || incy != 1 ||
|
||||
bli_is_unaligned_to( a+lda, 16 ) )
|
||||
bli_is_unaligned_to( lda*sizeof(double), 16 ) )
|
||||
{
|
||||
use_ref = TRUE;
|
||||
}
|
||||
|
||||
Reference in New Issue
Block a user