mirror of
https://github.com/kvcache-ai/ktransformers.git
synced 2026-04-30 03:01:16 +00:00
fix bug
This commit is contained in:
@@ -38,6 +38,7 @@ To install KTransformers, follow the official [Installation Guide](https://kvcac
|
||||
python ktransformers/server/main.py \
|
||||
--port 10021 \
|
||||
--model_path path-to-Qwen3-Next-80B-A3B-Thinking \
|
||||
--gguf_path path-to-Qwen3-Next-80B-A3B-Thinking \
|
||||
--model_name Qwen3NextForCausalLM \
|
||||
--optimize_config_path <local_path>/ktransformers/optimize/optimize_rules/Qwen3Next-serve.yaml \
|
||||
--max_new_tokens 1024 \
|
||||
|
||||
Reference in New Issue
Block a user