From 289aadb9d43eac010dee25863544a51b98e7abb7 Mon Sep 17 00:00:00 2001
From: Iwan Kawrakow
Date: Tue, 6 Jan 2026 13:14:30 +0000
Subject: [PATCH] Disable ring reduction for now

---
 ggml/src/ggml-backend.cpp    | 2 +-
 ggml/src/ggml-cuda/reduce.cu | 2 +-
 2 files changed, 2 insertions(+), 2 deletions(-)

diff --git a/ggml/src/ggml-backend.cpp b/ggml/src/ggml-backend.cpp
index d780e891..a6524b88 100644
--- a/ggml/src/ggml-backend.cpp
+++ b/ggml/src/ggml-backend.cpp
@@ -1111,7 +1111,7 @@ static bool ggml_is_view_op(enum ggml_op op) {
 #endif
 
 #ifndef GGML_SCHED_MAX_COPIES
-#define GGML_SCHED_MAX_COPIES 4
+#define GGML_SCHED_MAX_COPIES 1
 #endif
 
 struct ggml_backend_sched_split {
diff --git a/ggml/src/ggml-cuda/reduce.cu b/ggml/src/ggml-cuda/reduce.cu
index 53d54f74..81a48d88 100644
--- a/ggml/src/ggml-cuda/reduce.cu
+++ b/ggml/src/ggml-cuda/reduce.cu
@@ -196,7 +196,7 @@ void ggml_cuda_op_reduce([[maybe_unused]] ggml_backend_cuda_context & ctx, ggml_
     // i = 0, peer = 1, ichunk = 1 -> copy part 1 from device 1, device 0 now has parts 0, 1, 2, 3
     // etc.
     //
-    if (dst->ne[1] >= 32) {
+    if (false && dst->ne[1] >= 32) {
         auto nelem = ggml_nelements(dst);
         auto elem_size = ggml_element_size(dst);
         auto nelem_per_device = (nelem + nhave - 1)/nhave;