This commit is contained in:
djw
2025-09-16 13:21:58 +00:00
parent a44b710649
commit 0437660e62
4 changed files with 31 additions and 12 deletions

View File

@@ -38,6 +38,7 @@ To install KTransformers, follow the official [Installation Guide](https://kvcac
python ktransformers/server/main.py \
--port 10021 \
--model_path path-to-Qwen3-Next-80B-A3B-Thinking \
--gguf_path path-to-Qwen3-Next-80B-A3B-Thinking \
--model_name Qwen3NextForCausalLM \
--optimize_config_path <local_path>/ktransformers/optimize/optimize_rules/Qwen3Next-serve.yaml \
--max_new_tokens 1024 \