Merge pull request #36 from kvcache-ai/release/post1-transformers-kt-dep-20260430

fix: align sglang kt post1 deps and fp8 alias
This commit is contained in:
Peilin Li
2026-04-30 02:47:11 +08:00
committed by GitHub
2 changed files with 22 additions and 1 deletions

View File

@@ -70,7 +70,7 @@ dependencies = [
"torchcodec==0.8.0 ; sys_platform != 'linux' or (sys_platform == 'linux' and platform_machine != 'aarch64' and platform_machine != 'arm64' and platform_machine != 'armv7l')", # torchcodec is not available on those systems. If it is not provided, transformers will use torchvision instead by default.
"torchvision==0.24.1",
"tqdm",
"transformers==4.57.1",
"transformers-kt==5.6.0.post1",
"uvicorn",
"uvloop",
"xgrammar==0.1.27",

View File

@@ -5283,6 +5283,7 @@ class ServerArgs:
assert (
self.tp_size * self.pp_size
) % self.nnodes == 0, "tp_size must be divisible by number of nodes"
self.normalize_kt_method_aliases()
if self.pp_size > 1:
assert (
@@ -5411,6 +5412,26 @@ class ServerArgs:
"When enabling two batch overlap, moe_a2a_backend cannot be 'none'."
)
def normalize_kt_method_aliases(self):
    """Rewrite a deprecated ``kt_method`` spelling to its canonical name.

    ``self.kt_method`` is left untouched when it is ``None`` or when it has
    no entry in the alias table. Otherwise a deprecation warning is logged
    and the canonical name is stored back on ``self.kt_method``.
    """
    # Deprecated spelling -> canonical spelling.
    deprecated_to_canonical = {"RAWFP8": "FP8"}

    requested = self.kt_method
    canonical = (
        None if requested is None else deprecated_to_canonical.get(requested)
    )

    if canonical is not None:
        # Warn before overwriting so the message still shows what the user
        # originally passed.
        logger.warning(
            "--kt-method %s is deprecated; using %s. "
            "Use --kt-method %s in new scripts.",
            requested,
            canonical,
            canonical,
        )
        self.kt_method = canonical
def check_torch_2_9_1_cudnn_compatibility(self):
if get_bool_env_var("SGLANG_DISABLE_CUDNN_CHECK"):
return