From 9970e3bf328a1f59d9a7f79613c7d620ca522068 Mon Sep 17 00:00:00 2001 From: Yineng Zhang Date: Sat, 30 Aug 2025 04:02:25 -0700 Subject: [PATCH] chore: upgrade sgl-kernel 0.3.7.post1 with deepgemm fix (#9822) --- docker/Dockerfile | 4 ++-- python/pyproject.toml | 2 +- python/sglang/srt/entrypoints/engine.py | 2 +- 3 files changed, 4 insertions(+), 4 deletions(-) diff --git a/docker/Dockerfile b/docker/Dockerfile index e08c77b0e..eb6cca3b9 100644 --- a/docker/Dockerfile +++ b/docker/Dockerfile @@ -85,10 +85,10 @@ RUN python3 -m pip install --no-cache-dir --upgrade pip setuptools wheel html5li && python3 -m pip install --no-cache-dir nvidia-nccl-cu12==2.27.6 --force-reinstall --no-deps \ && python3 -m flashinfer --download-cubin \ && if [ "$CUDA_VERSION" = "12.8.1" ]; then \ - python3 -m pip install --no-cache-dir https://github.com/sgl-project/whl/releases/download/v0.3.7/sgl_kernel-0.3.7+cu128-cp310-abi3-manylinux2014_x86_64.whl --force-reinstall --no-deps ; \ + python3 -m pip install --no-cache-dir https://github.com/sgl-project/whl/releases/download/v0.3.7.post1/sgl_kernel-0.3.7.post1+cu128-cp310-abi3-manylinux2014_x86_64.whl --force-reinstall --no-deps ; \ fi \ && if [ "$CUDA_VERSION" = "12.9.1" ]; then \ - python3 -m pip install --no-cache-dir https://github.com/sgl-project/whl/releases/download/v0.3.7/sgl_kernel-0.3.7+cu129-cp310-abi3-manylinux2014_x86_64.whl --force-reinstall --no-deps ; \ + python3 -m pip install --no-cache-dir https://github.com/sgl-project/whl/releases/download/v0.3.7.post1/sgl_kernel-0.3.7.post1+cu129-cp310-abi3-manylinux2014_x86_64.whl --force-reinstall --no-deps ; \ fi # Download source files diff --git a/python/pyproject.toml b/python/pyproject.toml index 4ff0015ca..f6ccffcfe 100644 --- a/python/pyproject.toml +++ b/python/pyproject.toml @@ -58,7 +58,7 @@ runtime_common = [ srt = [ "sglang[runtime_common]", - "sgl-kernel==0.3.7", + "sgl-kernel==0.3.7.post1", "torch==2.8.0", "torchaudio==2.8.0", "torchvision", diff --git a/python/sglang/srt/entrypoints/engine.py b/python/sglang/srt/entrypoints/engine.py index 3c2e87bd7..2b576b409 100644 --- a/python/sglang/srt/entrypoints/engine.py +++ b/python/sglang/srt/entrypoints/engine.py @@ -680,7 +680,7 @@ def _set_envs_and_config(server_args: ServerArgs): if _is_cuda and not get_bool_env_var("SGLANG_SKIP_SGL_KERNEL_VERSION_CHECK"): assert_pkg_version( "sgl-kernel", - "0.3.7", + "0.3.7.post1", "Please reinstall the latest version with `pip install sgl-kernel --force-reinstall`", )