Files
exllamav3/eval/spec/llama3.1-8b-instruct_exl3.json
2025-04-06 14:42:49 +02:00

74 lines
2.2 KiB
JSON

[
{
"load_fn": "exllamav3",
"fwd_fn": "exllamav3",
"label": "EXL3 1.7bpw H3",
"model_dir": "/mnt/str/eval_models/llama3.1-8b-instruct/exl3/1.7bpw_H3/"
},
{
"load_fn": "exllamav3",
"fwd_fn": "exllamav3",
"label": "EXL3 1.8bpw H3",
"model_dir": "/mnt/str/eval_models/llama3.1-8b-instruct/exl3/1.8bpw_H3/"
},
{
"load_fn": "exllamav3",
"fwd_fn": "exllamav3",
"label": "EXL3 1.9bpw H3",
"model_dir": "/mnt/str/eval_models/llama3.1-8b-instruct/exl3/1.9bpw_H3/"
},
{
"load_fn": "exllamav3",
"fwd_fn": "exllamav3",
"label": "EXL3 2.0bpw H6",
"model_dir": "/mnt/str/eval_models/llama3.1-8b-instruct/exl3/2.0bpw/"
},
{
"load_fn": "exllamav3",
"fwd_fn": "exllamav3",
"label": "EXL3 2.25bpw H6",
"model_dir": "/mnt/str/eval_models/llama3.1-8b-instruct/exl3/2.25bpw/"
},
{
"load_fn": "exllamav3",
"fwd_fn": "exllamav3",
"label": "EXL3 2.5bpw H6",
"model_dir": "/mnt/str/eval_models/llama3.1-8b-instruct/exl3/2.5bpw/"
},
{
"load_fn": "exllamav3",
"fwd_fn": "exllamav3",
"label": "EXL3 3.0bpw H6",
"model_dir": "/mnt/str/eval_models/llama3.1-8b-instruct/exl3/3.0bpw/"
},
{
"load_fn": "exllamav3",
"fwd_fn": "exllamav3",
"label": "EXL3 3.5bpw H6",
"model_dir": "/mnt/str/eval_models/llama3.1-8b-instruct/exl3/3.5bpw/"
},
{
"load_fn": "exllamav3",
"fwd_fn": "exllamav3",
"label": "EXL3 4.0bpw H6",
"model_dir": "/mnt/str/eval_models/llama3.1-8b-instruct/exl3/4.0bpw/"
},
{
"load_fn": "exllamav3",
"fwd_fn": "exllamav3",
"label": "EXL3 5.0bpw H6",
"model_dir": "/mnt/str/eval_models/llama3.1-8b-instruct/exl3/5.0bpw/"
},
{
"load_fn": "exllamav3",
"fwd_fn": "exllamav3",
"label": "EXL3 6.0bpw H6",
"model_dir": "/mnt/str/eval_models/llama3.1-8b-instruct/exl3/6.0bpw/"
},
{
"load_fn": "exllamav3",
"fwd_fn": "exllamav3",
"label": "EXL3 8.0bpw H6",
"model_dir": "/mnt/str/eval_models/llama3.1-8b-instruct/exl3/8.0bpw/"
}
]