Save checkpoint during prompt processing (pp)

2026-04-22 23:49:23 +00:00 · 2026-02-25 19:05:54 -06:00
parent 233898704c
commit 7962e9a4b3
4 changed files with 47 additions and 28 deletions
--- a/examples/server/server-context.h
+++ b/examples/server/server-context.h
@@ -104,6 +104,8 @@ struct server_slot {

    void prompt_load(server_prompt_cache& prompt_cache, const server_tokens& tokens);

+    size_t checkpoint_pos = 0;
+
    // sampling
    llama_token sampled; // in speculative mode, this is the last accepted token
    llama_tokens drafted;
@@ -358,5 +360,7 @@ struct server_context {

    void apply_checkpoint(server_slot & slot);

+    void create_checkpoint_at_interval(server_slot & slot, const gpt_params & params_base);
+
    void release_slot_after_final_response(server_slot & slot);
 };