Fix regressions in chat stop-condition filtering and architecture parameters

2026-04-20 14:29:28 +00:00 · 2024-11-10 12:58:11 +01:00
parent b28300c0db
commit d37cf7e764
2 changed files with 3 additions and 2 deletions
--- a/examples/chat.py
+++ b/examples/chat.py
@@ -262,7 +262,7 @@ min_space_in_context = args.response_chunk
 # Stop conditions

 sc = prompt_format.stop_conditions(tokenizer)
-sc = [x for x in sc if x]
+sc = [x for x in sc if x is not None]
 generator.set_stop_conditions(sc)

 # ANSI color codes
--- a/exllamav2/architecture.py
+++ b/exllamav2/architecture.py
@@ -401,6 +401,7 @@ class ExLlamaV2ArchParams:
                "mlp_up": ".mlp.c_fc",
                "mlp_down": ".mlp.c_proj",
                "lm_head": "model.embed_tokens",
+                "norm_eps": "layer_norm_epsilon",
            })
            self.lm.mlp_act_func = "gelu"
            self.lm.norm = "layernorm"
@@ -471,9 +472,9 @@ class ExLlamaV2ArchParams:
                "mlp_up": ".block_sparse_moe.experts.*.v1",
                "mlp_down": ".block_sparse_moe.experts.*.w2",
                "mlp_expert_gate": ".block_sparse_moe.gate",
-                "lm_head": "model.embed_tokens",
                "fused_qkv": ".self_attn.Wqkv",
            })
+            self.lm.norm = "layernorm"
            self.lm.is_moe = True

        # Phi3