From b22bdd965de330343a53d89d657f62511c70bfb4 Mon Sep 17 00:00:00 2001 From: Iwan Kawrakow Date: Sun, 15 Jun 2025 08:05:55 +0300 Subject: [PATCH] Fix q8_k_r8 on Zen4 --- ggml/src/iqk/iqk_gemm_kquants.cpp | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/ggml/src/iqk/iqk_gemm_kquants.cpp b/ggml/src/iqk/iqk_gemm_kquants.cpp index ecc17092..c8f3020c 100644 --- a/ggml/src/iqk/iqk_gemm_kquants.cpp +++ b/ggml/src/iqk/iqk_gemm_kquants.cpp @@ -1839,7 +1839,7 @@ static void mul_mat_q8_k_r8_q8_k(int n, const void * vx, size_t bx, const DataIn } } #ifdef HAVE_FANCY_SIMD - auto m4 = _mm256_mul_ps(d4, _mm256_set1_ps(-128.f)); + auto m4 = _mm256_mul_ps(d4, _mm256_set1_ps(-127.f)); #endif for (int iy = 0; iy < nrc_y; ++iy) { auto d4y = _mm256_mul_ps(d4, _mm256_set1_ps(q8.scale(iy, ibl)));