Disable ring reduction for now and lower the default GGML_SCHED_MAX_COPIES from 4 to 1

2026-03-13 07:20:15 +00:00 · 2026-01-06 13:14:30 +00:00
parent d9236392cf
commit 289aadb9d4
2 changed files with 2 additions and 2 deletions
--- a/ggml/src/ggml-backend.cpp
+++ b/ggml/src/ggml-backend.cpp
@@ -1111,7 +1111,7 @@ static bool ggml_is_view_op(enum ggml_op op) {
 #endif

 #ifndef GGML_SCHED_MAX_COPIES
-#define GGML_SCHED_MAX_COPIES 4
+#define GGML_SCHED_MAX_COPIES 1
 #endif

 struct ggml_backend_sched_split {
--- a/ggml/src/ggml-cuda/reduce.cu
+++ b/ggml/src/ggml-cuda/reduce.cu
@@ -196,7 +196,7 @@ void ggml_cuda_op_reduce([[maybe_unused]] ggml_backend_cuda_context & ctx, ggml_
    //   i = 0, peer = 1, ichunk = 1 -> copy part 1 from device 1, device 0 now has parts 0, 1, 2, 3
    //   etc.
    //
-    if (dst->ne[1] >= 32) {
+    if (false && dst->ne[1] >= 32) {
        auto nelem = ggml_nelements(dst);
        auto elem_size = ggml_element_size(dst);
        auto nelem_per_device = (nelem + nhave - 1)/nhave;