Fixed bug introduced by bugfix in 25b258d.

Details:
- We actually need to check alignment of lda*sizeof(double) and NOT
  a+lda because in the latter case, alignment could cancel out and
  still allow the optimized code to run when it shouldn't. Thanks
  to Devin for pointing this out.
This commit is contained in:
Field G. Van Zee
2014-09-18 10:24:20 -05:00
parent 25b258d61f
commit e80a453784
3 changed files with 3 additions and 3 deletions

View File

@@ -92,7 +92,7 @@ void bli_daxpyf_opt_var1(
use_ref = TRUE;
}
else if ( inca != 1 || incx != 1 || incy != 1 ||
bli_is_unaligned_to( a+lda, 16 ) )
bli_is_unaligned_to( lda*sizeof(double), 16 ) )
{
use_ref = TRUE;
}

View File

@@ -116,7 +116,7 @@ void bli_ddotxaxpyf_opt_var1( conj_t conjat,
use_ref = TRUE;
}
else if ( inca != 1 || incw != 1 || incx != 1 || incy != 1 || incz != 1 ||
bli_is_unaligned_to( a+lda, 16 ) )
bli_is_unaligned_to( lda*sizeof(double), 16 ) )
{
use_ref = TRUE;
}

View File

@@ -104,7 +104,7 @@ void bli_ddotxf_opt_var1(
use_ref = TRUE;
}
else if ( inca != 1 || incx != 1 || incy != 1 ||
bli_is_unaligned_to( a+lda, 16 ) )
bli_is_unaligned_to( lda*sizeof(double), 16 ) )
{
use_ref = TRUE;
}