mirror of
https://github.com/kvcache-ai/sglang.git
synced 2026-06-30 03:37:51 +00:00
Merge pull request #36 from kvcache-ai/release/post1-transformers-kt-dep-20260430
fix: align sglang kt post1 deps and fp8 alias
This commit is contained in:
@@ -70,7 +70,7 @@ dependencies = [
|
||||
"torchcodec==0.8.0 ; sys_platform != 'linux' or (sys_platform == 'linux' and platform_machine != 'aarch64' and platform_machine != 'arm64' and platform_machine != 'armv7l')", # torchcodec does not exist in those systems. If not provided, transformer will use torchvision instead by default.
|
||||
"torchvision==0.24.1",
|
||||
"tqdm",
|
||||
"transformers==4.57.1",
|
||||
"transformers-kt==5.6.0.post1",
|
||||
"uvicorn",
|
||||
"uvloop",
|
||||
"xgrammar==0.1.27",
|
||||
|
||||
@@ -5283,6 +5283,7 @@ class ServerArgs:
|
||||
assert (
|
||||
self.tp_size * self.pp_size
|
||||
) % self.nnodes == 0, "tp_size must be divisible by number of nodes"
|
||||
self.normalize_kt_method_aliases()
|
||||
|
||||
if self.pp_size > 1:
|
||||
assert (
|
||||
@@ -5411,6 +5412,26 @@ class ServerArgs:
|
||||
"When enabling two batch overlap, moe_a2a_backend cannot be 'none'."
|
||||
)
|
||||
|
||||
def normalize_kt_method_aliases(self):
    """Replace a deprecated ``kt_method`` spelling with its current name.

    ``self.kt_method`` is left untouched when it is ``None`` or is not one
    of the known deprecated aliases. Otherwise a deprecation warning is
    logged and the replacement value is stored back on ``self.kt_method``.
    """
    requested = self.kt_method
    if requested is None:
        return

    # Deprecated spelling -> spelling that should be used instead.
    replacements = {"RAWFP8": "FP8"}
    canonical = replacements.get(requested)
    if canonical is None:
        # Not a deprecated alias; keep the value exactly as given.
        return

    logger.warning(
        "--kt-method %s is deprecated; using %s. "
        "Use --kt-method %s in new scripts.",
        requested,
        canonical,
        canonical,
    )
    self.kt_method = canonical
|
||||
|
||||
def check_torch_2_9_1_cudnn_compatibility(self):
|
||||
if get_bool_env_var("SGLANG_DISABLE_CUDNN_CHECK"):
|
||||
return
|
||||
|
||||
Reference in New Issue
Block a user