mirror of
https://github.com/turboderp-org/exllamav2.git
synced 2026-03-15 00:07:26 +00:00
Add Qwen3ForCausalLM
This commit is contained in:
@@ -428,6 +428,19 @@ class ExLlamaV2ArchParams:
|
||||
self.lm.attention_bias_qkv = True
|
||||
self.lm.supports_tp = True
|
||||
|
||||
# Qwen3
|
||||
|
||||
if arch_string == "Qwen3ForCausalLM":
|
||||
arch_recognized = True
|
||||
self.lm.layer_keys += \
|
||||
layer_keys_llama_norms + \
|
||||
layer_keys_llama_attn + \
|
||||
layer_keys_llama_mlp
|
||||
self.lm.expect_keys += \
|
||||
expect_keys_llama
|
||||
self.lm.supports_tp = True
|
||||
self.lm.default_use_qk_norm = True
|
||||
|
||||
# Qwen2-VL (2, 2.5)
|
||||
|
||||
if arch_string in ["Qwen2VLForConditionalGeneration", "Qwen2_5_VLForConditionalGeneration"]:
|
||||
|
||||
Reference in New Issue
Block a user