mirror of
https://github.com/kvcache-ai/ktransformers.git
synced 2026-04-19 22:09:10 +00:00
* [feat]: simplify sglang installation with submodule, auto-sync CI, and version alignment
- Add kvcache-ai/sglang as git submodule at third_party/sglang (branch = main)
- Add top-level install.sh for one-click source installation (sglang + kt-kernel)
- Add sglang-kt as hard dependency in kt-kernel/pyproject.toml
- Add CI workflow to auto-sync sglang submodule daily and create PR
- Add CI workflow to build and publish sglang-kt to PyPI
- Integrate sglang-kt build into release-pypi.yml (version.py bump publishes both packages)
- Align sglang-kt version with ktransformers via SGLANG_KT_VERSION env var injection
- Update Dockerfile to use submodule and inject aligned version
- Update all 13 doc files, CLI hints, and i18n strings to reference new install methods
Co-Authored-By: Claude Opus 4.6 <noreply@anthropic.com>
* [build]: bump version to 0.5.2
Co-Authored-By: Claude Opus 4.6 <noreply@anthropic.com>
* [build]: rename PyPI package from kt-kernel to ktransformers
Users can now `pip install ktransformers` to get everything
(sglang-kt is auto-installed as a dependency).
Co-Authored-By: Claude Opus 4.6 <noreply@anthropic.com>
* Revert "[build]: rename PyPI package from kt-kernel to ktransformers"
This reverts commit e0cbbf6364.
* [build]: add ktransformers meta-package for PyPI
`pip install ktransformers` now works as a single install command.
It pulls kt-kernel (which in turn pulls sglang-kt).
Co-Authored-By: Claude Opus 4.6 <noreply@anthropic.com>
* [fix]: show sglang-kt package version in kt version command
- Prioritize sglang-kt package version (aligned with ktransformers)
over sglang internal __version__
- Update display name from "sglang" to "sglang-kt"
Co-Authored-By: Claude Opus 4.6 <noreply@anthropic.com>
* [fix]: improve sglang-kt detection in kt doctor and kt version
Recognize sglang-kt package name as proof of kvcache-ai fork installation.
Previously both commands fell through to "PyPI (not recommended)" for
non-editable local source installs. Now version.py reuses the centralized
check_sglang_installation() logic.
Co-Authored-By: Claude Opus 4.6 <noreply@anthropic.com>
* [build]: bump version to 0.5.2.post1
Co-Authored-By: Claude Opus 4.6 <noreply@anthropic.com>
---------
Co-authored-by: Claude Opus 4.6 <noreply@anthropic.com>
420 lines
14 KiB
Python
420 lines
14 KiB
Python
"""
|
|
SGLang installation checker and installation instructions provider.
|
|
|
|
This module provides utilities to:
|
|
- Check if SGLang is installed and get its metadata
|
|
- Provide installation instructions when SGLang is not found
|
|
"""
|
|
|
|
import subprocess
|
|
import sys
|
|
from pathlib import Path
|
|
from typing import Optional
|
|
|
|
from kt_kernel.cli.i18n import t
|
|
from kt_kernel.cli.utils.console import console
|
|
|
|
|
|
def _sglang_pip_metadata() -> tuple:
    """Ask pip about ``sglang-kt`` first, then ``sglang``.

    Returns:
        ``(fields, is_kvcache_fork)`` where ``fields`` maps ``pip show`` field
        names to values (empty when neither package is known to pip) and
        ``is_kvcache_fork`` is True only when the ``sglang-kt`` query succeeded.

    Raises:
        subprocess.TimeoutExpired, OSError: propagated from ``subprocess.run``.
    """
    for package, is_fork in (("sglang-kt", True), ("sglang", False)):
        result = subprocess.run(
            [sys.executable, "-m", "pip", "show", package],
            capture_output=True,
            text=True,
            timeout=10,
        )
        if result.returncode == 0:
            fields = {}
            for line in result.stdout.split("\n"):
                if ":" in line:
                    key, value = line.split(":", 1)
                    fields[key.strip()] = value.strip()
            return fields, is_fork
    return {}, False


def _sglang_find_git_root(start: Path, max_levels: int = 3) -> Optional[Path]:
    """Return the first of ``start`` and its parents (``max_levels`` dirs) holding ``.git``."""
    candidate = start
    for _ in range(max_levels):
        if (candidate / ".git").exists():
            return candidate
        if candidate.parent == candidate:  # Reached the filesystem root
            break
        candidate = candidate.parent
    return None


def _sglang_github_short_name(remote_url: str) -> Optional[str]:
    """Reduce a GitHub remote URL (https or git@ form) to ``org/repo``.

    Returns None when the URL does not mention github.com.
    """
    if "github.com" not in remote_url:
        return None
    # Everything after the first "github.com" is the repository path.
    tail = remote_url.rstrip("/").split("github.com", 1)[1]
    # Strip only a trailing ".git"; a blanket replace would also eat the
    # ".git" inside repository names such as "user/user.github.io".
    if tail.endswith(".git"):
        tail = tail[: -len(".git")]
    return tail.lstrip("/:")


def _sglang_read_git_info(git_root: Path) -> Optional[dict]:
    """Read the ``origin`` remote and current branch of the checkout at ``git_root``.

    Returns None when git is unavailable, times out, or yields neither value.
    """

    def git_output(*args: str) -> Optional[str]:
        result = subprocess.run(
            ["git", *args],
            cwd=git_root,
            capture_output=True,
            text=True,
            timeout=5,
        )
        return result.stdout.strip() if result.returncode == 0 else None

    try:
        remote_url = git_output("remote", "get-url", "origin")
        remote_short = _sglang_github_short_name(remote_url) if remote_url else None
        branch = git_output("branch", "--show-current")
    except (subprocess.TimeoutExpired, FileNotFoundError, OSError):
        return None

    if not (remote_url or branch):
        return None
    return {
        "remote": remote_short or remote_url,
        "branch": branch,
    }


def check_sglang_installation() -> dict:
    """Check if SGLang is installed and get its metadata.

    Returns:
        dict with keys:
        - installed: bool
        - version: str or None
        - location: str or None (installation path)
        - editable: bool (whether installed in editable mode)
        - git_info: dict or None (git remote and branch if available)
        - from_source: bool (whether installed from source repository)
        - is_kvcache_fork: bool (whether pip knows the install as ``sglang-kt``)
    """
    try:
        import sglang
    except ImportError:
        return {
            "installed": False,
            "version": None,
            "location": None,
            "editable": False,
            "git_info": None,
            "from_source": False,
            "is_kvcache_fork": False,
        }

    version = getattr(sglang, "__version__", None)

    # Use pip show to get detailed package information.
    try:
        pip_info, is_kvcache_fork = _sglang_pip_metadata()
    except (subprocess.TimeoutExpired, FileNotFoundError, OSError):
        pip_info, is_kvcache_fork = {}, False

    location = pip_info.get("Location")
    editable = False
    editable_location = pip_info.get("Editable project location")
    if editable_location:
        editable = True
        location = editable_location

    # Fall back to the imported module's path whenever pip gave no location:
    # that covers pip raising as well as pip exiting non-zero (e.g. pip is not
    # installed in this environment).
    if not location:
        module_file = getattr(sglang, "__file__", None)
        if module_file:
            location = str(Path(module_file).parent.parent)

    # A .git directory at the location or up to 2 parents marks a source install.
    git_root = _sglang_find_git_root(Path(location)) if location else None
    from_source = git_root is not None
    git_info = _sglang_read_git_info(git_root) if git_root is not None else None

    return {
        "installed": True,
        "version": version,
        "location": location,
        "editable": editable,
        "git_info": git_info,
        "from_source": from_source,
        "is_kvcache_fork": is_kvcache_fork,
    }
|
|
|
|
|
|
def get_sglang_install_instructions(lang: Optional[str] = None) -> str:
    """Get SGLang installation instructions.

    The text carries console markup tags such as ``[bold]``/``[cyan]``
    (NOTE(review): this matches Rich markup syntax; confirm ``console`` is a
    Rich console).

    Args:
        lang: Language code ('en' or 'zh'). If None, uses current language setting.
            Any value other than 'zh' yields the English text.

    Returns:
        Formatted installation instructions string.
    """
    if lang is None:
        # Imported lazily: only needed when the caller did not choose a language.
        from kt_kernel.cli.i18n import get_lang

        lang = get_lang()

    # The extras marker is written as ``\[all]`` (escaped bracket) so the markup
    # parser prints it literally instead of consuming ``[all]`` as a style tag,
    # which would drop it from the displayed pip command.
    if lang == "zh":
        return """
[bold yellow]SGLang \u672a\u5b89\u88c5[/bold yellow]

\u8bf7\u9009\u62e9\u4ee5\u4e0b\u65b9\u5f0f\u4e4b\u4e00\u5b89\u88c5 SGLang (kvcache-ai \u5206\u652f):

[bold]\u65b9\u5f0f A - \u4e00\u952e\u5b89\u88c5 (\u63a8\u8350):[/bold]
\u4ece ktransformers \u6839\u76ee\u5f55\u8fd0\u884c:
[cyan]./install.sh[/cyan]

[bold]\u65b9\u5f0f B - pip \u5b89\u88c5:[/bold]
[cyan]pip install sglang-kt[/cyan]

[bold]\u65b9\u5f0f C - \u4ece\u6e90\u7801\u5b89\u88c5:[/bold]
git clone --recursive https://github.com/kvcache-ai/ktransformers.git
cd ktransformers
pip install "third_party/sglang/python\\[all]"

[dim]\u6ce8\u610f: \u8bf7\u786e\u4fdd\u5728\u6b63\u786e\u7684 Python \u73af\u5883\u4e2d\u6267\u884c\u4ee5\u4e0a\u547d\u4ee4[/dim]
"""

    return """
[bold yellow]SGLang is not installed[/bold yellow]

Install SGLang (kvcache-ai fork) using one of these methods:

[bold]Option A - One-click install (recommended):[/bold]
From the ktransformers root directory, run:
[cyan]./install.sh[/cyan]

[bold]Option B - pip install:[/bold]
[cyan]pip install sglang-kt[/cyan]

[bold]Option C - From source:[/bold]
git clone --recursive https://github.com/kvcache-ai/ktransformers.git
cd ktransformers
pip install "third_party/sglang/python\\[all]"

[dim]Note: Make sure to run these commands in the correct Python environment[/dim]
"""
|
|
|
|
|
|
def print_sglang_install_instructions() -> None:
    """Write the SGLang installation instructions to the shared console.

    The text comes from ``get_sglang_install_instructions()`` called without
    arguments, so the language follows the current language setting.
    """
    console.print(get_sglang_install_instructions())
|
|
|
|
|
|
def check_sglang_and_warn() -> bool:
    """Check if SGLang is installed, print guidance if something is off.

    When SGLang is missing, the installation instructions are printed. When it
    is installed but is neither a source checkout nor the ``sglang-kt``
    package, a warning recommending the kvcache-ai fork is printed.

    Returns:
        True if SGLang is installed, False otherwise.
    """
    info = check_sglang_installation()

    if not info["installed"]:
        print_sglang_install_instructions()
        return False

    # A pip-installed ``sglang-kt`` is the kvcache-ai fork itself (and is one of
    # the install options this module recommends), so it must not trigger the
    # "installed from PyPI" warning; only a non-source, non-fork install does.
    is_fork_package = info.get("is_kvcache_fork", False)
    if not info["from_source"] and not is_fork_package:
        from kt_kernel.cli.utils.console import print_warning

        print_warning(t("sglang_pypi_warning"))
        console.print()
        console.print("[dim]" + t("sglang_recommend_source") + "[/dim]")
        console.print()

    return True
|
|
|
|
|
|
def _get_sglang_kt_kernel_cache_path() -> Path:
    """Get the path to the sglang kt-kernel support cache file.

    The cache directory (``~/.ktransformers/cache``) is created on a
    best-effort basis: if it cannot be created, the path is still returned and
    the later read/write on it fails with an ``OSError`` the caller can handle.

    Returns:
        Path of the ``sglang_kt_kernel_supported`` marker file.
    """
    cache_dir = Path.home() / ".ktransformers" / "cache"
    try:
        cache_dir.mkdir(parents=True, exist_ok=True)
    except OSError:
        # The cache is an optimisation only; an unwritable home directory must
        # not abort the command that merely wanted to consult the cache.
        pass
    return cache_dir / "sglang_kt_kernel_supported"
|
|
|
|
|
|
def _is_sglang_kt_kernel_cache_valid() -> bool:
    """Tell whether the cached kt-kernel support check recorded a success.

    The cache counts as valid only when the marker file exists and its
    content, stripped and lower-cased, equals 'true'. A missing or unreadable
    file counts as "not valid".

    Returns:
        True if cache is valid and indicates support, False otherwise.
    """
    marker = _get_sglang_kt_kernel_cache_path()
    if not marker.exists():
        return False
    try:
        return marker.read_text().strip().lower() == "true"
    except OSError:  # IOError is an alias of OSError on Python 3
        return False
|
|
|
|
|
|
def _save_sglang_kt_kernel_cache(supported: bool) -> None:
    """Persist the kt-kernel support check result in the cache marker file.

    Args:
        supported: Outcome of the check; stored as the text 'true' or 'false'.
    """
    marker = _get_sglang_kt_kernel_cache_path()
    payload = "true" if supported else "false"
    try:
        marker.write_text(payload)
    except OSError:  # IOError is an alias of OSError on Python 3
        # Failing to write the cache is not an error worth surfacing.
        pass
|
|
|
|
|
|
def clear_sglang_kt_kernel_cache() -> None:
    """Remove the kt-kernel support cache marker so the next run re-checks.

    Errors while probing for or deleting the file are ignored.
    """
    marker = _get_sglang_kt_kernel_cache_path()
    try:
        if not marker.exists():
            return
        marker.unlink()
    except OSError:  # IOError is an alias of OSError on Python 3
        pass
|
|
|
|
|
|
def check_sglang_kt_kernel_support(use_cache: bool = True, silent: bool = False) -> dict:
    """Probe whether the installed SGLang accepts kt-kernel parameters.

    Runs `python -m sglang.launch_server --help` with the current interpreter
    and looks for `--kt-gpu-prefill-token-threshold` in the combined
    stdout/stderr. That parameter is only available in the kvcache-ai/sglang
    fork, not in the official sglang.

    A positive result is written to the cache; negative results and errors are
    not cached, so they are re-checked on the next call.

    Args:
        use_cache: If True, return immediately when the cache records a
            previous success. Default is True.
        silent: If True, don't print the checking message. Default is False.

    Returns:
        dict with keys:
        - supported: bool - True if kt-kernel parameters are supported
        - help_output: str or None - The help output from sglang.launch_server
        - error: str or None - Error message if check failed
        - from_cache: bool - True if result was from cache
    """
    from kt_kernel.cli.utils.console import print_step

    def outcome(supported, help_output=None, error=None, from_cache=False):
        # Single place that fixes the shape (and key order) of the result.
        return {
            "supported": supported,
            "help_output": help_output,
            "error": error,
            "from_cache": from_cache,
        }

    # A cached success short-circuits the (slow) subprocess probe.
    if use_cache and _is_sglang_kt_kernel_cache_valid():
        return outcome(True, from_cache=True)

    if not silent:
        print_step(t("sglang_checking_kt_kernel_support"))

    probe_cmd = [sys.executable, "-m", "sglang.launch_server", "--help"]
    try:
        completed = subprocess.run(
            probe_cmd,
            capture_output=True,
            text=True,
            timeout=30,
        )
        combined = completed.stdout + completed.stderr
        has_flag = "--kt-gpu-prefill-token-threshold" in combined
        if has_flag:
            _save_sglang_kt_kernel_cache(True)
        return outcome(has_flag, help_output=combined)
    except subprocess.TimeoutExpired:
        return outcome(False, error="Timeout while checking sglang.launch_server --help")
    except FileNotFoundError:
        return outcome(False, error="Python interpreter not found")
    except Exception as e:
        # Boundary catch-all: report the failure to the caller instead of raising.
        return outcome(False, error=str(e))
|
|
|
|
|
|
def print_sglang_kt_kernel_instructions() -> None:
    """Print how to replace the current SGLang with the kvcache-ai fork.

    The message is chosen by the current language setting: Chinese for 'zh',
    English for anything else.
    """
    from kt_kernel.cli.i18n import get_lang

    zh_message = """
[bold red]SGLang 不支持 kt-kernel[/bold red]

您当前安装的 SGLang 不包含 kt-kernel 支持。
kt-kernel 需要使用 kvcache-ai 维护的 SGLang 分支。

[bold]请按以下步骤重新安装:[/bold]

[cyan]1. 卸载当前的 SGLang:[/cyan]
pip uninstall sglang -y

[cyan]2. 安装 kvcache-ai 版本 (选择一种方式):[/cyan]

[bold]方式 A - 一键安装 (推荐):[/bold]
从 ktransformers 根目录运行: ./install.sh

[bold]方式 B - pip 安装:[/bold]
pip install sglang-kt

[dim]注意: 请确保在正确的 Python 环境中执行以上命令[/dim]
"""

    en_message = """
[bold red]SGLang does not support kt-kernel[/bold red]

Your current SGLang installation does not include kt-kernel support.
kt-kernel requires the kvcache-ai maintained fork of SGLang.

[bold]Please reinstall SGLang:[/bold]

[cyan]1. Uninstall current SGLang:[/cyan]
pip uninstall sglang -y

[cyan]2. Install the kvcache-ai fork (choose one):[/cyan]

[bold]Option A - One-click install (recommended):[/bold]
From the ktransformers root directory, run: ./install.sh

[bold]Option B - pip install:[/bold]
pip install sglang-kt

[dim]Note: Make sure to run these commands in the correct Python environment[/dim]
"""

    message = zh_message if get_lang() == "zh" else en_message
    console.print(message)
|