diff --git a/ggml/src/iqk/fa/iqk_fa_templates.h b/ggml/src/iqk/fa/iqk_fa_templates.h index b11c2989..481515cb 100644 --- a/ggml/src/iqk/fa/iqk_fa_templates.h +++ b/ggml/src/iqk/fa/iqk_fa_templates.h @@ -226,7 +226,8 @@ struct HelperQ8KV final : public BaseHelper { struct HelperQ80 final : public BaseHelper { using Base = BaseHelper; constexpr static ggml_type type = GGML_TYPE_Q8_0; -#ifdef HAVE_FANCY_SIMD +//#ifdef HAVE_FANCY_SIMD +#ifdef __AVX2__ using block_q8 = block_q8_2; constexpr static int block_size_q = QK8_2; #else diff --git a/ggml/src/iqk/iqk_gemm_legacy_quants.cpp b/ggml/src/iqk/iqk_gemm_legacy_quants.cpp index 9595b4ce..b617606a 100644 --- a/ggml/src/iqk/iqk_gemm_legacy_quants.cpp +++ b/ggml/src/iqk/iqk_gemm_legacy_quants.cpp @@ -3299,9 +3299,12 @@ inline std::pair mul_mat_kernel(int int_typeA, int nq) { if (nq == 4) return std::make_pair(mul_mat_qX_0_q8_2_Tx, 4); MAKE_FUNCS(mul_mat_qX_1_q8_2_T, 1); - if (nq == 2) return std::make_pair(mul_mat_qX_0_q8_0_Tx, 2); - if (nq == 4) return std::make_pair(mul_mat_qX_0_q8_0_Tx, 4); + //if (nq == 1) return std::make_pair(mul_mat_qX_0_q8_0_Tx, 1); + //if (nq == 2) return std::make_pair(mul_mat_qX_0_q8_0_Tx, 2); + //if (nq == 4) return std::make_pair(mul_mat_qX_0_q8_0_Tx, 4); + if (nq == 1) return std::make_pair(mul_mat_qX_0_q8_0_T, 1); + if (nq == 2) return std::make_pair(mul_mat_qX_0_q8_0_T, 2); + if (nq == 4) return std::make_pair(mul_mat_qX_0_q8_0_T, 4); if (nq == 3) return std::make_pair(mul_mat_qX_0_q8_0_T, 3); if (nq == 5) return std::make_pair(mul_mat_qX_0_q8_0_T, 5); if (nq == 6) return std::make_pair(mul_mat_qX_0_q8_0_T, 6);