diff --git a/docker/Dockerfile b/docker/Dockerfile index 3b9a420b3..e9351ddae 100644 --- a/docker/Dockerfile +++ b/docker/Dockerfile @@ -85,7 +85,7 @@ RUN python3 -m pip install --no-cache-dir --upgrade pip setuptools wheel html5li && python3 -m pip install --no-cache-dir nvidia-nccl-cu12==2.27.6 --force-reinstall --no-deps \ && python3 -m flashinfer --download-cubin \ && if [ "$CUDA_VERSION" = "12.6.1" ]; then \ - python3 -m pip install --no-cache-dir https://github.com/sgl-project/whl/releases/download/v0.3.9.post2/sgl_kernel-0.3.9.post2+cu124-cp310-abi3-manylinux2014_x86_64.whl --force-reinstall --no-deps ; \ + python3 -m pip install --no-cache-dir https://github.com/sgl-project/whl/releases/download/v0.3.10/sgl_kernel-0.3.10+cu124-cp310-abi3-manylinux2014_x86_64.whl --force-reinstall --no-deps ; \ fi # Download source files diff --git a/docker/Dockerfile.gb200 b/docker/Dockerfile.gb200 index 7a7747ef0..c76ae8640 100644 --- a/docker/Dockerfile.gb200 +++ b/docker/Dockerfile.gb200 @@ -4,7 +4,7 @@ FROM nvidia/cuda:${CUDA_VERSION}-cudnn-devel-ubuntu22.04 ARG BUILD_TYPE=blackwell ARG DEEPEP_COMMIT=1b14ad661c7640137fcfe93cccb2694ede1220b0 ARG CMAKE_BUILD_PARALLEL_LEVEL=2 -ARG SGL_KERNEL_VERSION=0.3.9.post2 +ARG SGL_KERNEL_VERSION=0.3.10 ENV DEBIAN_FRONTEND=noninteractive \ CUDA_HOME=/usr/local/cuda \ GDRCOPY_HOME=/usr/src/gdrdrv-2.4.4/ \ diff --git a/python/pyproject.toml b/python/pyproject.toml index ee9b05861..d7a1a36ef 100755 --- a/python/pyproject.toml +++ b/python/pyproject.toml @@ -57,7 +57,7 @@ dependencies = [ "uvicorn", "uvloop", "xgrammar==0.1.24", - "sgl-kernel==0.3.9.post2", + "sgl-kernel==0.3.10", "torch==2.8.0", "torchaudio==2.8.0", "torchvision", @@ -67,10 +67,10 @@ dependencies = [ "tiktoken", "anthropic>=0.20.0", "torch_memory_saver==0.0.8", - "decord", ] [project.optional-dependencies] +decord = ["decord"] test = [ "accelerate", "expecttest", @@ -88,8 +88,8 @@ tracing = [ "opentelemetry-exporter-otlp", "opentelemetry-exporter-otlp-proto-grpc", ] -all = ["sglang[test]"] -blackwell = ["nvidia-cutlass-dsl==4.1.0", "sglang[test]"] +all = ["sglang[test]", "sglang[decord]"] +blackwell = ["nvidia-cutlass-dsl==4.2.0", "sglang[test]"] dev = ["sglang[test]"] [project.urls] diff --git a/python/pyproject_other.toml b/python/pyproject_other.toml index 670fb6cc9..59c8db0e5 100755 --- a/python/pyproject_other.toml +++ b/python/pyproject_other.toml @@ -65,7 +65,7 @@ tracing = [ srt = [ "sglang[runtime_common]", - "sgl-kernel==0.3.9.post2", + "sgl-kernel==0.3.10", "torch==2.8.0", "torchaudio==2.8.0", "torchvision", @@ -75,13 +75,13 @@ srt = [ blackwell = [ "sglang[runtime_common]", - "sgl-kernel==0.3.9.post2", + "sgl-kernel==0.3.10", "torch==2.8.0", "torchaudio==2.8.0", "torchvision", "cuda-python", "flashinfer_python==0.3.1", - "nvidia-cutlass-dsl==4.1.0", + "nvidia-cutlass-dsl==4.2.0", ] # HIP (Heterogeneous-computing Interface for Portability) for AMD diff --git a/python/sglang/srt/entrypoints/engine.py b/python/sglang/srt/entrypoints/engine.py index 390e0985a..71c3def5f 100644 --- a/python/sglang/srt/entrypoints/engine.py +++ b/python/sglang/srt/entrypoints/engine.py @@ -690,7 +690,7 @@ def _set_envs_and_config(server_args: ServerArgs): if _is_cuda and not get_bool_env_var("SGLANG_SKIP_SGL_KERNEL_VERSION_CHECK"): assert_pkg_version( "sgl-kernel", - "0.3.9.post2", + "0.3.10", "Please reinstall the latest version with `pip install sgl-kernel --force-reinstall`", )