Add fused mul + multi_add op, with CPU implementation

This commit is contained in:
Iwan Kawrakow
2025-10-23 10:23:59 +03:00
parent db3ba4999f
commit c9b80b2665

View File

@@ -949,6 +949,7 @@ llm_expert_gating_func_type gating_op,
}
experts = ggml_mul(ctx, experts, weights);
cb(experts, "ffn_moe_weighted", il);
return experts;
}
if (n_expert_used == 1) {