From d5924781958475c5ec61d8e64cb8b1d98f6c240d Mon Sep 17 00:00:00 2001 From: "T. M." Date: Fri, 25 Jul 2025 05:26:30 +0000 Subject: [PATCH] correct value for n_ctx --- examples/server/server.cpp | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/examples/server/server.cpp b/examples/server/server.cpp index 401023cf..18ae25c7 100644 --- a/examples/server/server.cpp +++ b/examples/server/server.cpp @@ -910,7 +910,7 @@ struct server_context { gpt_params params_dft; params_dft.model = params.model_draft; - params_dft.n_ctx = params.n_gpu_layers_draft == 0 ? params.n_ctx / params.n_parallel : params.n_gpu_layers_draft; + params_dft.n_ctx = params.n_gpu_layers_draft == 0 ? params.n_ctx / params.n_parallel : params.n_ctx; // TODO: add params_base.speculative.n_ctx params_dft.n_gpu_layers = params.n_gpu_layers_draft; params_dft.n_parallel = 1; params_dft.cache_type_k = params.cache_type_k;