server: add checkpoint tolerance and fix grammar_trigger init (#1346)

Co-authored-by: firecoperana <firecoperana>
2026-04-22 15:39:23 +00:00 · 2026-03-02 00:45:32 -06:00
parent a568e12c8f
commit 8f9e19d57c
4 changed files with 27 additions and 4 deletions
--- a/examples/server/server-context.h
+++ b/examples/server/server-context.h
@@ -105,6 +105,7 @@ struct server_slot {
    void prompt_load(server_prompt_cache& prompt_cache, const server_tokens& tokens);

    size_t checkpoint_pos = 0;
+    bool do_checkpoint = false;

    // sampling
    llama_token sampled; // in speculative mode, this is the last accepted token