gguf-py : add IQ1_M to GGML_QUANT_SIZES (#6761)

This commit is contained in:
pmysl
2024-04-21 14:49:30 +02:00
committed by GitHub
parent 7270b7c21b
commit 250586b4a9

View File

@@ -872,6 +872,7 @@ GGML_QUANT_SIZES = {
GGMLQuantizationType.I32: (1, 4),
GGMLQuantizationType.I64: (1, 8),
GGMLQuantizationType.F64: (1, 8),
GGMLQuantizationType.IQ1_M: (256, QK_K // 8 + QK_K // 16 + QK_K // 32),
}