mirror of
https://github.com/ikawrakow/ik_llama.cpp.git
synced 2026-02-24 07:04:11 +00:00
Correct the value of n_ctx for the draft model (fall back to params.n_ctx instead of params.n_gpu_layers_draft)
This commit is contained in:
@@ -910,7 +910,7 @@ struct server_context {
|
||||
|
||||
gpt_params params_dft;
|
||||
params_dft.model = params.model_draft;
|
||||
- params_dft.n_ctx = params.n_gpu_layers_draft == 0 ? params.n_ctx / params.n_parallel : params.n_gpu_layers_draft;
|
||||
+ params_dft.n_ctx = params.n_gpu_layers_draft == 0 ? params.n_ctx / params.n_parallel : params.n_ctx; // TODO: add params_base.speculative.n_ctx
|
||||
params_dft.n_gpu_layers = params.n_gpu_layers_draft;
|
||||
params_dft.n_parallel = 1;
|
||||
params_dft.cache_type_k = params.cache_type_k;
|
||||
|
||||
Reference in New Issue
Block a user