Support new DeepGEMM format in per token group quant (part 2: srt) (#7155)

This commit is contained in:
fzyzcjy
2025-06-14 05:25:40 +08:00
committed by GitHub
parent 8ab7d93c2e
commit bec3e48402
3 changed files with 19 additions and 4 deletions

View File

@@ -605,7 +605,7 @@ def _set_envs_and_config(server_args: ServerArgs):
if _is_cuda:
assert_pkg_version(
"sgl-kernel",
"0.1.7",
"0.1.8.post1",
"Please reinstall the latest version with `pip install sgl-kernel --force-reinstall`",
)