From 0317ba5a015113b716236e328294df4e099d8a25 Mon Sep 17 00:00:00 2001 From: Iwan Kawrakow Date: Wed, 9 Oct 2024 18:09:35 +0300 Subject: [PATCH] iq3_ks: Fix CUDA dot product --- ggml/src/ggml-cuda/iqk_mmvq.cu | 6 +++--- 1 file changed, 3 insertions(+), 3 deletions(-) diff --git a/ggml/src/ggml-cuda/iqk_mmvq.cu b/ggml/src/ggml-cuda/iqk_mmvq.cu index 0dc82319..e3250f00 100644 --- a/ggml/src/ggml-cuda/iqk_mmvq.cu +++ b/ggml/src/ggml-cuda/iqk_mmvq.cu @@ -559,9 +559,9 @@ __device__ __forceinline__ float vec_dot_iq3_ks_q8_1( const int hshift = 4*(1-ib128); const uint16_t * values1 = iq3k_table + ((bq3->scales[4*ib128+0] << 6) & 0x40); - const uint16_t * values2 = iq3k_table + ((bq3->scales[4*ib128+0] << 6) & 0x40); - const uint16_t * values3 = iq3k_table + ((bq3->scales[4*ib128+0] << 6) & 0x40); - const uint16_t * values4 = iq3k_table + ((bq3->scales[4*ib128+0] << 6) & 0x40); + const uint16_t * values2 = iq3k_table + ((bq3->scales[4*ib128+1] << 6) & 0x40); + const uint16_t * values3 = iq3k_table + ((bq3->scales[4*ib128+2] << 6) & 0x40); + const uint16_t * values4 = iq3k_table + ((bq3->scales[4*ib128+3] << 6) & 0x40); const int * q8; int sumi[4] = {0, 0, 0, 0};