mirror of
https://github.com/ikawrakow/ik_llama.cpp.git
synced 2026-04-25 08:59:30 +00:00
server: exclude thinking tokens when finding the slot (#1079)
Refactor find slot; enable by default; fix load prompt; rename variables. Co-authored-by: firecoperana <firecoperana>
This commit is contained in:
@@ -177,6 +177,7 @@ struct server_prompt {
|
||||
server_tokens tokens;
|
||||
int n_kept_prompt;
|
||||
int n_discarded_prompt;
|
||||
thinking_tokens think_tokens;
|
||||
|
||||
std::vector<uint8_t> data;
|
||||
|
||||
|
||||
Reference in New Issue
Block a user