From 1ef4b5eddc20869a1ad797f3f275d843f4a36fec Mon Sep 17 00:00:00 2001 From: Kawrakow Date: Thu, 5 Mar 2026 10:25:50 +0100 Subject: [PATCH] Disable split mode graph for recurrent/hybrid models when tensor overrides (#1366) --- src/llama.cpp | 8 ++++++++ 1 file changed, 8 insertions(+) diff --git a/src/llama.cpp b/src/llama.cpp index 825800bb..f3daeeed 100644 --- a/src/llama.cpp +++ b/src/llama.cpp @@ -1981,6 +1981,14 @@ static bool llm_load_tensors( LLAMA_LOG_WARN("================================================================\n\n"); max_gpu = 4; } + else if (llama_model_has_recurrent(&model) && model.has_tensor_overrides()) { + LLAMA_LOG_WARN("\n================================================================\n"); + LLAMA_LOG_WARN("Split mode 'graph' for recurrent/hybrid models is currently\n"); + LLAMA_LOG_WARN("disabled when using tensor overrides\n"); + LLAMA_LOG_WARN(" => changing split mode to 'layer'\n"); + LLAMA_LOG_WARN("=======================================================\n\n"); + split_mode = LLAMA_SPLIT_MODE_LAYER; + } } }