ling

2026-05-11 00:10:09 +00:00 · 2024-08-15 00:39:12 -07:00
parent 0524133714
commit 7fcfb93090
1 changed file with 4 additions and 8 deletions
--- a/backend/operations_gguf.py
+++ b/backend/operations_gguf.py
@@ -45,14 +45,6 @@ def dequantize(data, qtype, oshape):
    return blocks.reshape(oshape)


-def to_uint32(x):
-    # (c) City96 || Apache-2.0 (apache.org/licenses/LICENSE-2.0)
-
-    # no uint32 :(
-    x = x.view(torch.uint8).to(torch.int32)
-    return (x[:, 0] | x[:, 1] << 8 | x[:, 2] << 16 | x[:, 3] << 24).unsqueeze(1)
-
-
 def dequantize_blocks_Q8_0(blocks, block_size, type_size):
    # (c) City96 || Apache-2.0 (apache.org/licenses/LICENSE-2.0)

@@ -64,6 +56,10 @@ def dequantize_blocks_Q8_0(blocks, block_size, type_size):
 def dequantize_blocks_Q5_0(blocks, block_size, type_size):
    # (c) City96 || Apache-2.0 (apache.org/licenses/LICENSE-2.0)

+    def to_uint32(x):
+        x = x.view(torch.uint8).to(torch.int32)
+        return (x[:, 0] | x[:, 1] << 8 | x[:, 2] << 16 | x[:, 3] << 24).unsqueeze(1)
+
    n_blocks = blocks.shape[0]

    d = blocks[:, :2]