Mirror of https://github.com/turboderp-org/exllamav3.git, synced 2026-03-15 00:07:24 +00:00.
BlockSparseMLP: Make sure bias is always applied during calibration
This commit is contained in:
@@ -113,6 +113,8 @@ def routing_dots(bsz, cfg, y, params):
    activate_all_experts = params.get("activate_all_experts")
    if activate_all_experts:
        routing_weights = router_logits.sigmoid()
        if cfg.e_score_correction_bias is not None:
            routing_weights += cfg.e_score_correction_bias.unsqueeze(0)
        factor = cfg.routed_scaling_factor / (routing_weights.sum(dim = -1, keepdim = True) + 1e-20)
        routing_weights *= factor
        selected_experts = (
||||
Reference in New Issue
Block a user