mirror of
https://github.com/theroyallab/tabbyAPI.git
synced 2026-04-20 14:28:54 +00:00
Logging: Clarify new vs cached tokens in prompt processing
This commit is contained in:
@@ -1125,6 +1125,7 @@ class ExllamaV2Container:
|
||||
log_metrics(
|
||||
result.get("time_enqueued"),
|
||||
result.get("prompt_tokens"),
|
||||
result.get("cached_tokens"),
|
||||
result.get("time_prefill"),
|
||||
result.get("new_tokens"),
|
||||
result.get("time_generate"),
|
||||
|
||||
Reference in New Issue
Block a user