mirror of
https://github.com/ikawrakow/ik_llama.cpp.git
synced 2026-04-26 17:39:37 +00:00
Fix q6_0 K cache
This commit is contained in:
@@ -2690,7 +2690,7 @@ inline std::pair<mul_mat_t, int> mul_mat_kernel(int int_typeA, int nq) {
|
||||
MAKE_FUNCS_ONLY_NRC(mul_mat_q8_0_r8_q8_2, nq);
|
||||
#endif
|
||||
}
|
||||
- else if (typeA == GGML_TYPE_Q8_0) {
|
||||
+ else if (typeA == GGML_TYPE_Q6_0) {
|
||||
#ifdef __aarch64__
|
||||
MAKE_FUNCS(mul_mat_qX_0_q8_0<DequantizerQ60, nq);
|
||||
#else
|
||||
|
||||
Reference in New Issue
Block a user