From 25662974f8ff19a8be8bc013f305cfe3b7b99a8f Mon Sep 17 00:00:00 2001
From: layerdiffusion <19834515+lllyasviel@users.noreply.github.com>
Date: Tue, 27 Aug 2024 18:42:00 -0700
Subject: [PATCH] try to test #1502

---
 packages_3rdparty/gguf/quants.py | 2 ++
 1 file changed, 2 insertions(+)

diff --git a/packages_3rdparty/gguf/quants.py b/packages_3rdparty/gguf/quants.py
index c0d144d5..4e013141 100644
--- a/packages_3rdparty/gguf/quants.py
+++ b/packages_3rdparty/gguf/quants.py
@@ -620,6 +620,8 @@ class Q8_0(__Quant, qtype=GGMLQuantizationType.Q8_0):
         if d.device != x.device:
             d = d.to(device=x.device)
 
+        x = x.to(cls.computation_dtype)
+
         return x * d
 
     @classmethod