WIP: add iq3_kl quantization mix

2026-04-28 18:32:04 +00:00 · 2024-10-08 13:56:29 +03:00
parent 4c76471979
commit 1dd6c40c15
11 changed files with 110 additions and 10 deletions
--- a/include/llama.h
+++ b/include/llama.h
@@ -178,6 +178,7 @@ extern "C" {
        LLAMA_FTYPE_MOSTLY_IQ2_TN        = 143, // except 1d tensors
        LLAMA_FTYPE_MOSTLY_IQ1_TN        = 144, // except 1d tensors
        LLAMA_FTYPE_MOSTLY_IQ4_XXS       = 145, // except 1d tensors
+        LLAMA_FTYPE_MOSTLY_IQ3_KL        = 146, // except 1d tensors

        LLAMA_FTYPE_GUESSED = 1024, // not specified in the model file
    };