From 868f662eb69add3931e36d679133421683f59c3f Mon Sep 17 00:00:00 2001
From: layerdiffusion <19834515+lllyasviel@users.noreply.github.com>
Date: Sun, 25 Aug 2024 14:44:01 -0700
Subject: [PATCH] fix

---
 packages_3rdparty/gguf/quants.py | 1 +
 1 file changed, 1 insertion(+)

diff --git a/packages_3rdparty/gguf/quants.py b/packages_3rdparty/gguf/quants.py
index 84083da9..dcea8f5a 100644
--- a/packages_3rdparty/gguf/quants.py
+++ b/packages_3rdparty/gguf/quants.py
@@ -609,6 +609,7 @@ class Q8_0(__Quant, qtype=GGMLQuantizationType.Q8_0):
     def bake_layer_weight(cls, layer, weight):
         blocks = weight.data
         d, x = quick_split(blocks, [2])
+        x = x.view(torch.int8)
         d = d.view(torch.float16).to(cls.computation_dtype)
         weight.data = x
         layer.quant_state_0 = torch.nn.Parameter(d, requires_grad=False)