mirror of
https://github.com/ikawrakow/ik_llama.cpp.git
synced 2026-04-29 10:51:51 +00:00
iq6_k: WIP (quantize/dequantize)
This commit is contained in:
@@ -174,7 +174,8 @@ extern "C" {
|
||||
LLAMA_FTYPE_MOSTLY_IQ3_K = 39, // except 1d tensors
|
||||
LLAMA_FTYPE_MOSTLY_IQ4_K = 40, // except 1d tensors
|
||||
LLAMA_FTYPE_MOSTLY_IQ5_K = 41, // except 1d tensors
|
||||
- LLAMA_FTYPE_MOSTLY_IQ2_TN = 42, // except 1d tensors
|
||||
+ LLAMA_FTYPE_MOSTLY_IQ6_K = 42, // except 1d tensors
|
||||
+ LLAMA_FTYPE_MOSTLY_IQ2_TN = 43, // except 1d tensors
|
||||
|
||||
LLAMA_FTYPE_GUESSED = 1024, // not specified in the model file
|
||||
};
|
||||
|
||||
Reference in New Issue
Block a user