mirror of
https://github.com/turboderp-org/exllamav3.git
synced 2026-04-27 09:43:28 +00:00
20 lines
524 B
JSON
20 lines
524 B
JSON
[
    {
        "model_dir": "/mnt/str/models/llama3.1-8b-instruct/qtip/2bit-hyb",
        "load_fn": "qtip",
        "fwd_fn": "qtip",
        "label": "QTIP 2bit-HYB"
    },
    {
        "model_dir": "/mnt/str/models/llama3.1-8b-instruct/qtip/3bit-hyb",
        "load_fn": "qtip",
        "fwd_fn": "qtip",
        "label": "QTIP 3bit-HYB"
    },
    {
        "model_dir": "/mnt/str/models/llama3.1-8b-instruct/qtip/4bit-hyb",
        "load_fn": "qtip",
        "fwd_fn": "qtip",
        "label": "QTIP 4bit-HYB"
    }
]