From 25b258d61f9c8cee64e922f4131784b6edb196dd Mon Sep 17 00:00:00 2001 From: "Field G. Van Zee" Date: Thu, 18 Sep 2014 10:10:49 -0500 Subject: [PATCH] Fixed a non-fatal problem with bugfix in a68b316c. Details: - The bugfix in a68b316c was inadvertently checking alignment of the leading dimension itself, rather than the byte size of the leading dimension. Now, we simply check alignment of a+lda. --- kernels/x86_64/core2-sse3/1f/bli_axpyf_opt_var1.c | 2 +- kernels/x86_64/core2-sse3/1f/bli_dotxaxpyf_opt_var1.c | 2 +- kernels/x86_64/core2-sse3/1f/bli_dotxf_opt_var1.c | 2 +- 3 files changed, 3 insertions(+), 3 deletions(-) diff --git a/kernels/x86_64/core2-sse3/1f/bli_axpyf_opt_var1.c b/kernels/x86_64/core2-sse3/1f/bli_axpyf_opt_var1.c index bdb9ff5ff..da87112a4 100644 --- a/kernels/x86_64/core2-sse3/1f/bli_axpyf_opt_var1.c +++ b/kernels/x86_64/core2-sse3/1f/bli_axpyf_opt_var1.c @@ -92,7 +92,7 @@ void bli_daxpyf_opt_var1( use_ref = TRUE; } else if ( inca != 1 || incx != 1 || incy != 1 || - bli_is_unaligned_to( lda, 16 ) ) + bli_is_unaligned_to( a+lda, 16 ) ) { use_ref = TRUE; } diff --git a/kernels/x86_64/core2-sse3/1f/bli_dotxaxpyf_opt_var1.c b/kernels/x86_64/core2-sse3/1f/bli_dotxaxpyf_opt_var1.c index af21ede35..e5a7fead3 100644 --- a/kernels/x86_64/core2-sse3/1f/bli_dotxaxpyf_opt_var1.c +++ b/kernels/x86_64/core2-sse3/1f/bli_dotxaxpyf_opt_var1.c @@ -116,7 +116,7 @@ void bli_ddotxaxpyf_opt_var1( conj_t conjat, use_ref = TRUE; } else if ( inca != 1 || incw != 1 || incx != 1 || incy != 1 || incz != 1 || - bli_is_unaligned_to( lda, 16 ) ) + bli_is_unaligned_to( a+lda, 16 ) ) { use_ref = TRUE; } diff --git a/kernels/x86_64/core2-sse3/1f/bli_dotxf_opt_var1.c b/kernels/x86_64/core2-sse3/1f/bli_dotxf_opt_var1.c index 741463925..e09e8fe92 100644 --- a/kernels/x86_64/core2-sse3/1f/bli_dotxf_opt_var1.c +++ b/kernels/x86_64/core2-sse3/1f/bli_dotxf_opt_var1.c @@ -104,7 +104,7 @@ void bli_ddotxf_opt_var1( use_ref = TRUE; } else if ( inca != 1 || incx != 1 || incy != 1 || - 
bli_is_unaligned_to( lda, 16 ) ) + bli_is_unaligned_to( a+lda, 16 ) ) { use_ref = TRUE; }