iq4_knn: Basics + CUDA

This commit is contained in:
Iwan Kawrakow
2024-10-16 18:37:47 +03:00
parent 03cabe1540
commit ebb5eb0fc8
15 changed files with 449 additions and 4 deletions

View File

@@ -181,6 +181,7 @@ extern "C" {
LLAMA_FTYPE_MOSTLY_IQ3_KL = 146, // except 1d tensors
LLAMA_FTYPE_MOSTLY_IQ2_KS = 147, // except 1d tensors
LLAMA_FTYPE_MOSTLY_IQ4_KSS = 148, // except 1d tensors
LLAMA_FTYPE_MOSTLY_IQ4_KNN = 149, // except 1d tensors
LLAMA_FTYPE_GUESSED = 1024, // not specified in the model file
};