From 8fd889dcad5c6c39ebcaa0202560843193745f6c Mon Sep 17 00:00:00 2001 From: layerdiffusion <19834515+lllyasviel@users.noreply.github.com> Date: Tue, 20 Aug 2024 08:04:09 -0700 Subject: [PATCH] fix #1336 --- packages_3rdparty/gguf/quants.py | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/packages_3rdparty/gguf/quants.py b/packages_3rdparty/gguf/quants.py index 4360bfeb..c6c80c91 100644 --- a/packages_3rdparty/gguf/quants.py +++ b/packages_3rdparty/gguf/quants.py @@ -805,7 +805,7 @@ class Q5_K(__Quant, qtype=GGMLQuantizationType.Q5_K): d, dmin, scales, qh, qs = quick_split(blocks, [2, 2, K_SCALE_SIZE, QK_K // 8]) d = d.view(torch.float16) dmin = dmin.view(torch.float16) - sc, m = Q4_K.get_scale_min(scales) + sc, m = Q4_K.get_scale_min_pytorch(scales) d = (d * sc).reshape((n_blocks, -1, 1)) dm = (dmin * m).reshape((n_blocks, -1, 1)) ql = qs.reshape((n_blocks, -1, 1, 32)) >> torch.tensor([0, 4], device=d.device, dtype=torch.uint8).reshape((1, 1, 2, 1))