From c9b80b2665b0927280a8dd243363cd1949c5d337 Mon Sep 17 00:00:00 2001 From: Iwan Kawrakow Date: Thu, 23 Oct 2025 10:23:59 +0300 Subject: [PATCH] Adding fused mul+multi_add + CPU implementation --- src/llama-build-context.cpp | 1 + 1 file changed, 1 insertion(+) diff --git a/src/llama-build-context.cpp b/src/llama-build-context.cpp index b8c7393d..55ae539f 100644 --- a/src/llama-build-context.cpp +++ b/src/llama-build-context.cpp @@ -949,6 +949,7 @@ llm_expert_gating_func_type gating_op, } experts = ggml_mul(ctx, experts, weights); cb(experts, "ffn_moe_weighted", il); + return experts; } if (n_expert_used == 1) {