More output in SD (speculative decoding) example

This commit is contained in:
turboderp
2023-11-10 20:16:08 +01:00
parent 898a5b909c
commit b302e310c8
2 changed files with 21 additions and 11 deletions

View File

@@ -119,3 +119,10 @@ print()
# Run the generation test with the speculative generator, then report its statistics.
test_gen(speculative_generator, gen_prompt, gen_settings, gen_max_tokens)
# get_sd_stats() is unpacked into exactly five values, in this order.
# NOTE(review): how each statistic is computed is defined by get_sd_stats(), which is not
# visible here -- confirm the definitions before interpreting the numbers.
efficiency, accuracy, total_tokens, total_draft_tokens, accepted_draft_tokens = speculative_generator.get_sd_stats()
# Print each statistic on its own labelled line.
print("efficiency:", efficiency)
print("accuracy:", accuracy)
print("total_tokens:", total_tokens)
print("total_draft_tokens:", total_draft_tokens)
print("accepted_draft_tokens:", accepted_draft_tokens)

View File

@@ -14,18 +14,21 @@ import torch
# Models to test
# NOTE(review): model_base is assigned twice below. This text looks like a diff hunk whose
# +/- markers were lost, so one assignment is probably the removed line and the other the
# added line. Read literally as Python, the last assignment is the one that takes effect.
model_base = "/mnt/str/models/_exl2/llama2-70b-chat-exl2/"
#model_base = "/mnt/str/models/_exl2"
model_base = "/mnt/str/models/_gptq/TheBloke_Yi-34B-GPTQ/"
# variants = [v for v in os.listdir(model_base) if os.path.isdir(os.path.join(model_base, v))]
# Hand-picked variant names; the commented-out line above would instead list every
# subdirectory of model_base.
# NOTE(review): presumably each entry is a path relative to model_base, with "" meaning
# model_base itself -- confirm against the code that consumes `variants`.
variants = \
[
"3.0bpw",
"4.0bpw",
"4.65bpw",
"",
# "goliath-120b-exl2/3.0bpw",
# "llama2-70b-exl2/3.0bpw",
# "llama2-70b-exl2/4.65bpw",
]
# NOTE(review): gpu_split is also assigned twice (same lost-diff-marker situation as
# model_base); read literally, (21.2, 24) is the value in effect. Presumably a per-GPU
# memory budget -- units are not shown here, confirm.
gpu_split = (19.5, 24)
gpu_split = (21.2, 24)
# Dataset identifier and split used for the Q&A evaluation.
# NOTE(review): "cais/mmlu" looks like a Hugging Face dataset id -- confirm where it is loaded.
qa_set = "cais/mmlu"
qa_split = "test"
@@ -33,12 +36,12 @@ qa_split = "test"
# Categories to evaluate.
# NOTE(review): presumably subject names within the qa_set dataset -- confirm.
# NOTE(review): this list interleaves active entries with a commented-out copy of most of
# them, which looks like the before/after sides of a diff whose +/- markers were lost.
# Read literally, "computer_security" appears twice among the active entries.
categories = \
[
"anatomy",
"computer_security",
"formal_logic",
"logical_fallacies",
"computer_security",
"philosophy",
"nutrition",
# "computer_security",
# "formal_logic",
# "logical_fallacies",
# "computer_security",
# "philosophy",
# "nutrition",
]
# NOTE(review): presumably the number of examples taken from each category -- how it is
# used is not visible here, confirm.
examples_per_category = 3