mirror of
https://github.com/ikawrakow/ik_llama.cpp.git
synced 2026-03-06 03:50:08 +00:00
Disable split mode graph for recurrent/hybrid models when using tensor overrides (#1366)
This commit is contained in:
@@ -1981,6 +1981,14 @@ static bool llm_load_tensors(
|
||||
LLAMA_LOG_WARN("================================================================\n\n");
|
||||
max_gpu = 4;
|
||||
}
|
||||
else if (llama_model_has_recurrent(&model) && model.has_tensor_overrides()) {
|
||||
LLAMA_LOG_WARN("\n================================================================\n");
|
||||
LLAMA_LOG_WARN("Split mode 'graph' for recurrent/hybrid models is currently\n");
|
||||
LLAMA_LOG_WARN("disabled when using tensor overrides\n");
|
||||
LLAMA_LOG_WARN(" => changing split mode to 'layer'\n");
|
||||
LLAMA_LOG_WARN("=======================================================\n\n");
|
||||
split_mode = LLAMA_SPLIT_MODE_LAYER;
|
||||
}
|
||||
}
|
||||
}
|
||||
|
||||
|
||||
Reference in New Issue
Block a user