mirror of
https://github.com/ikawrakow/ik_llama.cpp.git
synced 2026-04-30 11:21:56 +00:00
Fix more Q8_0 repacking mess on AVX2 (#719)
Co-authored-by: Iwan Kawrakow <iwan.kawrakow@gmail.com>
This commit is contained in:
@@ -502,10 +502,8 @@ extern "C" IQK_API bool iqk_mul_mat(long Nx, long Ny, long ne00,
|
|||||||
MulMat mm;
|
MulMat mm;
|
||||||
|
|
||||||
auto etypeA = ggml_type(typeA);
|
auto etypeA = ggml_type(typeA);
|
||||||
if (auto dequant_type = MulMat::is_dequant_better(etypeA, Ny); dequant_type != etypeA) {
|
if (auto dequant_type = MulMat::is_dequant_better(etypeA, Ny);
|
||||||
if (!MulMat::prepare(dequant_type, typeB, ne00, mm, Ny)) {
|
dequant_type != etypeA && MulMat::prepare(dequant_type, typeB, ne00, mm, Ny)) {
|
||||||
return false;
|
|
||||||
}
|
|
||||||
|
|
||||||
constexpr int k_x_step = 32;
|
constexpr int k_x_step = 32;
|
||||||
|
|
||||||
|
|||||||
Reference in New Issue
Block a user