mirror of
https://github.com/theroyallab/tabbyAPI.git
synced 2026-04-28 02:01:24 +00:00
Merge pull request #112 from DocShotgun/main
Separate new prompt tokens from those reused from cache in metric logging
This commit is contained in:
@@ -1144,6 +1144,7 @@ class ExllamaV2Container:
log_metrics(
    result.get("time_enqueued"),
    result.get("prompt_tokens"),
    result.get("cached_tokens"),
    result.get("time_prefill"),
    result.get("new_tokens"),
    result.get("time_generate"),
Reference in New Issue
Block a user