Add all Qwen3.5 model types (#1378)

* Add all Qwen3.5 model types

* Need also this
This commit is contained in:
Kawrakow
2026-03-07 09:01:33 +01:00
committed by GitHub
parent c1c3421462
commit 344688ce50
3 changed files with 10 additions and 3 deletions

View File

@@ -502,8 +502,8 @@ void llm_load_hparams(
}
switch (hparams.n_layer) {
case 28: model.type = e_model::MODEL_80B_A3B; break;
case 48: model.type = e_model::MODEL_80B_A3B; break;
case 40: model.type = e_model::MODEL_35B_A3B; break;
case 48: model.type = e_model::MODEL_122B_A10B; break;
case 60: model.type = e_model::MODEL_397B_A17B; break;
default: model.type = e_model::MODEL_UNKNOWN;
}
@@ -530,7 +530,8 @@ void llm_load_hparams(
}
switch (hparams.n_layer) {
case 24: model.type = e_model::MODEL_2B; break;
case 24: model.type = hparams.n_embd == 1024 ? e_model::MODEL_0_8B : e_model::MODEL_2B; break;
case 32: model.type = hparams.n_embd == 2560 ? e_model::MODEL_4B : e_model::MODEL_9B; break;
case 64: model.type = e_model::MODEL_27B; break;
default: model.type = e_model::MODEL_UNKNOWN;
}

View File

@@ -1681,6 +1681,7 @@ const char * llama_model_type_name(e_model type) {
case MODEL_0_3B: return "0.3B";
case MODEL_0_5B: return "0.5B";
case MODEL_0_6B: return "0.6B";
case MODEL_0_8B: return "0.8B";
case MODEL_1B: return "1B";
case MODEL_1_2B: return "1.2B";
case MODEL_1_3B: return "1.3B";
@@ -1743,10 +1744,12 @@ const char * llama_model_type_name(e_model type) {
case MODEL_16B_A1B: return "16B.A1B";
case MODEL_21B_A3B: return "21B.A3B";
case MODEL_30B_A3B: return "30B.A3B";
case MODEL_35B_A3B: return "35B.A3B";
case MODEL_80B_A3B: return "80B.A3B";
case MODEL_80B_A13B: return "80B.A13B";
case MODEL_100B_A6B: return "100B.A6B";
case MODEL_106B_A12B: return "106B.A12B";
case MODEL_122B_A10B: return "122B.A10B";
case MODEL_230B_A10B: return "230B.A10B";
case MODEL_235B_A22B: return "235B.A22B";
case MODEL_310B_A15B: return "310B.A15B";

View File

@@ -45,6 +45,7 @@ enum e_model {
MODEL_0_3B,
MODEL_0_5B,
MODEL_0_6B,
MODEL_0_8B,
MODEL_1B,
MODEL_1_2B,
MODEL_1_3B,
@@ -107,10 +108,12 @@ enum e_model {
MODEL_16B_A1B,
MODEL_21B_A3B, // Ernie MoE small
MODEL_30B_A3B,
MODEL_35B_A3B,
MODEL_80B_A3B, // Qwen3-Next
MODEL_80B_A13B,
MODEL_100B_A6B,
MODEL_106B_A12B,
MODEL_122B_A10B,
MODEL_230B_A10B, // Minimax M2
MODEL_235B_A22B,
MODEL_310B_A15B,