Slightly better matrix x vector on Zen4/AVX2 for iq2_k_r4, iq3_k_r4, iq4_k_r4 (#148)

* Slightly better matrix x vector on Zen4/AVX2 for iq2_k_r4, iq3_k_r4, iq4_k_r4

  More importantly: simplify.

* Minor

---------

Co-authored-by: Iwan Kawrakow <iwan.kawrakow@gmail.com>
2026-04-29 10:51:51 +00:00 · 2024-12-17 18:55:38 +01:00
parent a648191c2c
commit 2247afa967
2 changed files with 55 additions and 68 deletions
--- a/examples/llama-bench/llama-bench.cpp
+++ b/examples/llama-bench/llama-bench.cpp
@@ -238,7 +238,7 @@ struct cmd_params {
    int reps;
    bool verbose;
    bool warmup;
-    bool repack;
+    bool repack = false;
    output_formats output_format;
    output_formats output_format_stderr;
 };
@@ -632,7 +632,7 @@ struct cmd_params_instance {
    std::vector<float> tensor_split;
    bool use_mmap;
    bool embeddings;
-    bool repack;
+    bool repack = false;

    llama_model_params to_llama_mparams() const {
        llama_model_params mparams = llama_model_default_params();
@@ -811,7 +811,7 @@ struct test {
    std::vector<float> tensor_split;
    bool use_mmap;
    bool embeddings;
-    bool repack;
+    bool repack = false;
    int n_prompt;
    int n_gen;
    std::string test_time;