iq6_k: WIP (quantize/dequantize)

2026-04-29 10:51:51 +00:00 · 2024-08-07 16:49:43 +03:00
parent 54ce23bb61
commit 85f448e2b1
5 changed files with 150 additions and 119 deletions
--- a/include/llama.h
+++ b/include/llama.h
@@ -174,7 +174,8 @@ extern "C" {
        LLAMA_FTYPE_MOSTLY_IQ3_K         = 39, // except 1d tensors
        LLAMA_FTYPE_MOSTLY_IQ4_K         = 40, // except 1d tensors
        LLAMA_FTYPE_MOSTLY_IQ5_K         = 41, // except 1d tensors
-        LLAMA_FTYPE_MOSTLY_IQ2_TN        = 42, // except 1d tensors
+        LLAMA_FTYPE_MOSTLY_IQ6_K         = 42, // except 1d tensors
+        LLAMA_FTYPE_MOSTLY_IQ2_TN        = 43, // except 1d tensors

        LLAMA_FTYPE_GUESSED = 1024, // not specified in the model file
    };