fix: view Q8_0 block data as torch.int8 in bake_layer_weight

2026-05-11 00:10:09 +00:00 · 2024-08-25 14:44:01 -07:00
parent 13d6f8ed90
commit 868f662eb6
1 changed file with 1 addition and 0 deletions
--- a/packages_3rdparty/gguf/quants.py
+++ b/packages_3rdparty/gguf/quants.py
@@ -609,6 +609,7 @@ class Q8_0(__Quant, qtype=GGMLQuantizationType.Q8_0):
    def bake_layer_weight(cls, layer, weight):
        blocks = weight.data
        d, x = quick_split(blocks, [2])
+        x = x.view(torch.int8)
        d = d.view(torch.float16).to(cls.computation_dtype)
        weight.data = x
        layer.quant_state_0 = torch.nn.Parameter(d, requires_grad=False)