mirror of
https://github.com/ikawrakow/ik_llama.cpp.git
synced 2026-02-27 16:44:21 +00:00
server: enable checkpoint for recurrent models (#1310)
* server: enable checkpoint for recurrent models
  - create checkpoint after cancel
  - fix ban string and rm context during rewind
  - add checkpoint interval
  - only save recurrent cache
* save checkpoint during pp
---------
Co-authored-by: firecoperana <firecoperana>
This commit is contained in:
@@ -344,6 +344,8 @@ using server_task_result_ptr = std::unique_ptr<server_task_result>;
|
||||
struct server_prompt_checkpoint {
|
||||
llama_pos pos_min;
|
||||
llama_pos pos_max;
|
||||
llama_pos pos_min_prompt;
|
||||
llama_pos pos_max_prompt;
|
||||
|
||||
std::vector<uint8_t> data;
|
||||
|
||||
|
||||
Reference in New Issue
Block a user