More output in speculative decoding (SD) example

2026-04-20 14:29:28 +00:00 · 2023-11-10 20:16:08 +01:00
parent 898a5b909c
commit b302e310c8
2 changed files with 21 additions and 11 deletions
--- a/examples/speculative.py
+++ b/examples/speculative.py
@@ -119,3 +119,10 @@ print()

 test_gen(speculative_generator, gen_prompt, gen_settings, gen_max_tokens)

+efficiency, accuracy, total_tokens, total_draft_tokens, accepted_draft_tokens = speculative_generator.get_sd_stats()
+
+print("efficiency:", efficiency)
+print("accuracy:", accuracy)
+print("total_tokens:", total_tokens)
+print("total_draft_tokens:", total_draft_tokens)
+print("accepted_draft_tokens:", accepted_draft_tokens)
--- a/tests/test_mmlu.py
+++ b/tests/test_mmlu.py
@@ -14,18 +14,21 @@ import torch

 # Models to test

-model_base = "/mnt/str/models/_exl2/llama2-70b-chat-exl2/"
+#model_base = "/mnt/str/models/_exl2"
+
+model_base = "/mnt/str/models/_gptq/TheBloke_Yi-34B-GPTQ/"

 # variants = [v for v in os.listdir(model_base) if os.path.isdir(os.path.join(model_base, v))]

 variants = \
 [
-    "3.0bpw",
-    "4.0bpw",
-    "4.65bpw",
+    "",
+    # "goliath-120b-exl2/3.0bpw",
+    # "llama2-70b-exl2/3.0bpw",
+    # "llama2-70b-exl2/4.65bpw",
 ]

-gpu_split = (19.5, 24)
+gpu_split = (21.2, 24)

 qa_set = "cais/mmlu"
 qa_split = "test"
@@ -33,12 +36,12 @@ qa_split = "test"
 categories = \
 [
    "anatomy",
-    "computer_security",
-    "formal_logic",
-    "logical_fallacies",
-    "computer_security",
-    "philosophy",
-    "nutrition",
+    # "computer_security",
+    # "formal_logic",
+    # "logical_fallacies",
+    # "computer_security",
+    # "philosophy",
+    # "nutrition",
 ]

 examples_per_category = 3