From 005674cecc95b00a9f42ae5a484be2e9b38e93c1 Mon Sep 17 00:00:00 2001 From: Kawrakow Date: Mon, 22 Jul 2024 12:28:18 +0200 Subject: [PATCH] Fix "make it work for row sizes that are multiple of 4 on NEON" --- iqk_mul_mat.cpp | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/iqk_mul_mat.cpp b/iqk_mul_mat.cpp index 45d7816b..c83d2d84 100644 --- a/iqk_mul_mat.cpp +++ b/iqk_mul_mat.cpp @@ -4231,7 +4231,7 @@ template struct QF16 final : public QF16Base { for (int iy = 0; iy < nrc_y; ++iy) y[iy] = (const __fp16 *)(cx + iy*bx); } IQK_ALWAYS_INLINE Data load1(int iy, int i) const { return load(y[iy] + k_step*i); } - IQK_ALWAYS_INLINE Data load_tail(int iy, int i) const { return load4(y[iy] + k_step*i); } + IQK_ALWAYS_INLINE Data load_tail(int iy, int i) const { return load4(y[iy] + 4*i); } const __fp16 * y[nrc_y]; };