mirror of
https://github.com/turboderp-org/exllamav3.git
synced 2026-05-13 09:15:48 +00:00
17 lines
612 B
JSON
17 lines
612 B
JSON
{
|
|
"model": "/mnt/str/models/qwen3.5-27b/exl3/4.00bpw",
|
|
"stream": true,
|
|
"messages": [
|
|
{
|
|
"role": "system",
|
|
"content": "Given the following conversation, relevant context, and a follow up question, reply with an answer to the current question the user is asking. Return only your response to the question given the above information following the user's instructions as needed."
|
|
},
|
|
{
|
|
"role": "user",
|
|
"content": "Write a story about a cat that goes on an adventure."
|
|
}
|
|
],
|
|
"temperature": 0.7,
|
|
"max_tokens": 4096
|
|
}
|