mirror of
https://github.com/theroyallab/tabbyAPI.git
synced 2026-03-14 15:57:27 +00:00
Model: Add tokens in responses
Signed-off-by: kingbri <bdashore3@proton.me>
This commit is contained in:
2
model.py
2
model.py
@@ -355,4 +355,4 @@ class ModelContainer:
|
||||
if eos or generated_tokens == max_tokens: break
|
||||
|
||||
elapsed_time = last_chunk_time - start_time
|
||||
print(f"Response generated in {round(elapsed_time, 2)} seconds ({round(generated_tokens / elapsed_time, 2)} T/s)")
|
||||
print(f"Response: {round(generated_tokens, 2)} tokens generated in {round(elapsed_time, 2)} seconds ({round(generated_tokens / elapsed_time, 2)} T/s)")
|
||||
|
||||
Reference in New Issue
Block a user