Add Hunyuan MoE support for #561 (#565)

* add hunyuan moe

* Don't reshape Vcur

* Apply chat template fix from mainline PR #14584
This commit is contained in:
ubergarm
2025-07-09 04:29:40 -04:00
committed by GitHub
parent 6a56d5075d
commit db49223e8c
3 changed files with 258 additions and 0 deletions

View File

@@ -111,6 +111,7 @@ extern "C" {
LLAMA_VOCAB_PRE_TYPE_FALCON_3 = 34,
LLAMA_VOCAB_PRE_TYPE_FALCON_E = 35,
LLAMA_VOCAB_PRE_TYPE_SEED_CODER = 36, //llama.cpp lists this as 35
LLAMA_VOCAB_PRE_TYPE_HUNYUAN = 37, //llama.cpp lists this as 36
};
// note: these values should be synchronized with ggml_rope