iq5_k_r4: Zen4

The Zen4 implementation of iq5_k_r4 is much slower than those of the other _r4 quant types.
This commit is contained in:
Iwan Kawrakow
2024-12-18 09:17:30 +02:00
parent 9b6d14a299
commit 5eac4edc90
10 changed files with 349 additions and 2 deletions

View File

@@ -196,6 +196,7 @@ extern "C" {
LLAMA_FTYPE_MOSTLY_IQ2_K_R4 = 338, // except 1d tensors
LLAMA_FTYPE_MOSTLY_IQ3_K_R4 = 339, // except 1d tensors
LLAMA_FTYPE_MOSTLY_IQ4_K_R4 = 340, // except 1d tensors
LLAMA_FTYPE_MOSTLY_IQ5_K_R4 = 341, // except 1d tensors
LLAMA_FTYPE_MOSTLY_Q8_K_R8 = 399, // except 1d tensors
LLAMA_FTYPE_GUESSED = 1024, // not specified in the model file