Separate graph compute implementation for split mode graph

This commit is contained in:
Iwan Kawrakow
2025-12-11 16:53:54 +00:00
parent e6603ec882
commit 07ae4b1ef0
3 changed files with 165 additions and 243 deletions

View File

@@ -211,6 +211,7 @@ extern "C" {
// enable or disable op offload for a given op
GGML_API void ggml_backend_sched_set_op_offload(ggml_backend_sched_t sched, enum ggml_op op, bool on_or_off);
// turn the scheduler's "only active experts" setting on or off
// NOTE(review): the exact effect is not visible from this header - confirm against the implementation
GGML_API void ggml_backend_sched_set_only_active_experts(ggml_backend_sched_t sched, bool on_or_off);
// turn the scheduler's "split mode graph" setting on or off
// NOTE(review): presumably selects the separate graph compute path used for split mode graph - confirm against the implementation
GGML_API void ggml_backend_sched_set_split_mode_graph(ggml_backend_sched_t sched, bool on_or_off);
//
// Utils