Fix q6_0 K cache

This commit is contained in:
Iwan Kawrakow
2025-05-20 10:46:36 +03:00
parent 5351ec0442
commit 0943331ec9

View File

@@ -2690,7 +2690,7 @@ inline std::pair<mul_mat_t, int> mul_mat_kernel(int int_typeA, int nq) {
MAKE_FUNCS_ONLY_NRC(mul_mat_q8_0_r8_q8_2, nq);
#endif
}
-else if (typeA == GGML_TYPE_Q8_0) {
+else if (typeA == GGML_TYPE_Q6_0) {
#ifdef __aarch64__
MAKE_FUNCS(mul_mat_qX_0_q8_0<DequantizerQ60, nq);
#else