mirror of
https://github.com/ikawrakow/ik_llama.cpp.git
synced 2026-04-30 11:21:56 +00:00
Set max_gpu to 2 for Mimo2
This commit is contained in:
@@ -1761,6 +1761,13 @@ static bool llm_load_tensors(
|
|||||||
LLAMA_LOG_WARN(" => changing split mode to 'layer'\n");
|
LLAMA_LOG_WARN(" => changing split mode to 'layer'\n");
|
||||||
LLAMA_LOG_WARN("=======================================================\n\n");
|
LLAMA_LOG_WARN("=======================================================\n\n");
|
||||||
split_mode = LLAMA_SPLIT_MODE_LAYER;
|
split_mode = LLAMA_SPLIT_MODE_LAYER;
|
||||||
|
} else {
|
||||||
|
if (model.arch == LLM_ARCH_MIMO2 && model.devices.size() > 2 && max_gpu != 2) {
|
||||||
|
LLAMA_LOG_WARN("\n================================================================\n");
|
||||||
|
LLAMA_LOG_WARN("Split mode 'graph' for Mimo2 does not work with more than 2 GPUs\n");
|
||||||
|
LLAMA_LOG_WARN(" => setting max_gpu to 2\n");
|
||||||
|
LLAMA_LOG_WARN("================================================================\n\n");
|
||||||
|
}
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
|
|||||||
Reference in New Issue
Block a user