mirror of
https://github.com/turboderp-org/exllamav3.git
synced 2026-05-11 00:10:13 +00:00
20 lines
558 B
JSON
20 lines
558 B
JSON
[
    {
        "model_dir": "/mnt/str/models/llama3.1-70b-instruct/qtip/2bit-hyb-yaqa",
        "load_fn": "qtip",
        "fwd_fn": "qtip",
        "label": "QTIP 2bit-HYB-YAQA"
    },
    {
        "model_dir": "/mnt/str/models/llama3.1-70b-instruct/qtip/3bit-hyb-yaqa",
        "load_fn": "qtip",
        "fwd_fn": "qtip",
        "label": "QTIP 3bit-HYB-YAQA"
    },
    {
        "model_dir": "/mnt/str/models/llama3.1-70b-instruct/qtip/4bit-hyb-yaqa",
        "load_fn": "qtip",
        "fwd_fn": "qtip",
        "label": "QTIP 4bit-HYB-YAQA"
    }
]