add hunyuan moe support for 561 (#565)

* add hunyuan moe
* Don't reshape Vcur
* Apply chat template fix from mainline PR14584
2026-01-26 17:20:01 +00:00 · 2025-07-09 04:29:40 -04:00
parent 6a56d5075d
commit db49223e8c
3 changed files with 258 additions and 0 deletions
--- a/include/llama.h
+++ b/include/llama.h
@@ -111,6 +111,7 @@ extern "C" {
        LLAMA_VOCAB_PRE_TYPE_FALCON_3       = 34,
        LLAMA_VOCAB_PRE_TYPE_FALCON_E       = 35,
        LLAMA_VOCAB_PRE_TYPE_SEED_CODER     = 36, //llama.cpp lists this as 35
+        LLAMA_VOCAB_PRE_TYPE_HUNYUAN        = 37, //llama.cpp lists this as 36
    };

    // note: these values should be synchronized with ggml_rope