Do not use split mode graph scheduling if there are tensor overrides (#1060)

Co-authored-by: Iwan Kawrakow <iwan.kawrakow@gmail.com>
2026-03-13 23:40:09 +00:00 · 2025-12-12 14:48:38 +01:00
parent b3a19a6f37
commit 093cc7c380
1 changed file with 1 addition and 1 deletion
--- a/src/llama.cpp
+++ b/src/llama.cpp
@@ -4771,7 +4771,7 @@ struct llama_context * llama_new_context_with_model(
        LLAMA_LOG_INFO("XXXXXXXXXXXXXXXXXXXXX Setting only active experts offload\n");
        ggml_backend_sched_set_only_active_experts(ctx->sched, true);
    }
-    if (model->split_mode == LLAMA_SPLIT_MODE_GRAPH) {
+    if (model->split_mode == LLAMA_SPLIT_MODE_GRAPH && !model->has_tensor_overrides()) {
        ggml_backend_sched_set_split_mode_graph(ctx->sched, true);
    }