diff --git a/src/llama-build-context.cpp b/src/llama-build-context.cpp index b8c7393d..55ae539f 100644 --- a/src/llama-build-context.cpp +++ b/src/llama-build-context.cpp @@ -949,6 +949,7 @@ llm_expert_gating_func_type gating_op, } experts = ggml_mul(ctx, experts, weights); cb(experts, "ffn_moe_weighted", il); + return experts; } if (n_expert_used == 1) {