Adaptive p: history update fix + temp as flag (#1213)

* adaptive_p: fix history update + use current probability for high temp
* adaptive_p: fix history update bug, update with current probability if temp is high
* replace temp-as-signal with server argument
* adaptive_p: rename ema_w_cur_p to updt_w_cur
* delete test code
2026-02-11 00:40:09 +00:00 · 2026-02-03 00:36:12 -05:00
parent 589d80f677
commit b86d8024a5
7 changed files with 30 additions and 7 deletions
--- a/common/sampling.cpp
+++ b/common/sampling.cpp
@@ -120,7 +120,7 @@ struct llama_sampling_context * common_sampler_init(const struct llama_vocab* vo
            {
                GGML_ASSERT(vocab);
                auto n_vocab = llama_vocab_n_tokens(vocab);
-                result->adapt_p_ctx = llama_init_adaptive_p(n_vocab, params.adaptive_target, params.adaptive_decay, result->rng());
+                result->adapt_p_ctx = llama_init_adaptive_p(n_vocab, params.adaptive_target, params.adaptive_decay, params.adaptive_updt_w_cur, result->rng());
                break;
            }
            default: