Do not apply the expert weights scale if it is (approximately) 1

2026-02-24 15:14:10 +00:00 · 2025-10-20 08:21:21 +03:00
parent 599c812f12
commit acb0bc63fc
1 changed files with 1 additions and 1 deletions
--- a/src/llama-build-context.cpp
+++ b/src/llama-build-context.cpp
@@ -863,7 +863,7 @@ llm_expert_gating_func_type   gating_op,

        weights = ggml_reshape_3d(ctx, weights, 1, n_expert_used, n_tokens);
    }
-    if (scale_w) {
+    if (scale_w && std::abs(w_scale-1) > 1e-5f) {
        weights = ggml_scale(ctx, weights, w_scale);
        cb(weights, "ffn_moe_weights_scaled", il);
    }