mirror of
https://github.com/turboderp-org/exllamav3.git
synced 2026-04-29 10:41:26 +00:00
15 lines
447 B
JSON
15 lines
447 B
JSON
[
|
|
{
|
|
"model_dir": "/mnt/str/eval_models/llama3.1-70b-instruct/vptq/v8-k65536-0-woft",
|
|
"load_fn": "transformers_auto",
|
|
"fwd_fn": "transformers",
|
|
"label": "VPTQ v8-k65536-0-woft"
|
|
},
|
|
{
|
|
"model_dir": "/mnt/str/eval_models/llama3.1-70b-instruct/vptq/v16-k65536-32768-woft",
|
|
"load_fn": "transformers_auto",
|
|
"fwd_fn": "transformers",
|
|
"label": "VPTQ v16-k65536-32768-woft"
|
|
}
|
|
]
|