Rename q4_0_r4, q8_0_r4 and iq4_xs_r4 to _r8 (#189)

* Rename q4_0_r4 to q4_0_r8 to reflect actual row interleaving
* Rename q8_0_r4 to q8_0_r8 to reflect actual row interleaving
* Rename iq4_xs_r4 to iq4_xs_r8 to reflect actual row interleaving

---------

Co-authored-by: Iwan Kawrakow <iwan.kawrakow@gmail.com>
2026-03-04 19:10:03 +00:00 · 2025-02-06 18:45:28 +02:00
parent 7c94c3da56
commit 8049ffcbc8
10 changed files with 196 additions and 196 deletions
--- a/include/llama.h
+++ b/include/llama.h
@@ -181,8 +181,8 @@ extern "C" {
        LLAMA_FTYPE_MOSTLY_IQ2_KS        = 147, // except 1d tensors
        LLAMA_FTYPE_MOSTLY_IQ4_KSS       = 148, // except 1d tensors
                                                //
-        LLAMA_FTYPE_MOSTLY_Q4_0_R4       = 202, // except 1d tensors
-        LLAMA_FTYPE_MOSTLY_Q8_0_R4       = 207, // except 1d tensors
+        LLAMA_FTYPE_MOSTLY_Q4_0_R8       = 202, // except 1d tensors
+        LLAMA_FTYPE_MOSTLY_Q8_0_R8       = 207, // except 1d tensors
        LLAMA_FTYPE_MOSTLY_Q5_0_R4       = 208, // except 1d tensors
        LLAMA_FTYPE_MOSTLY_Q2_K_R4       = 210, // except 1d tensors
        LLAMA_FTYPE_MOSTLY_Q3_K_R4       = 211, // except 1d tensors
@@ -196,7 +196,7 @@ extern "C" {
        LLAMA_FTYPE_MOSTLY_IQ4_NL_R4     = 225, // except 1d tensors
        LLAMA_FTYPE_MOSTLY_IQ3_S_R4      = 226, // except 1d tensors
        LLAMA_FTYPE_MOSTLY_IQ2_M_R4      = 229, // except 1d tensors
-        LLAMA_FTYPE_MOSTLY_IQ4_XS_R4     = 230, // except 1d tensors
+        LLAMA_FTYPE_MOSTLY_IQ4_XS_R8     = 230, // except 1d tensors
        LLAMA_FTYPE_MOSTLY_IQ1_M_R4      = 231, // except 1d tensors
        LLAMA_FTYPE_MOSTLY_Q6_0_R4       = 335, // except 1d tensors
        LLAMA_FTYPE_MOSTLY_BF16_R16      = 232, // except 1d tensors