Bump sgl-kernel from 0.1.7 to 0.1.8 and choose the DeepGEMM source by CUDA version.

Summary of the hunks below:
  * docker/Dockerfile.blackwell: install the sgl_kernel 0.1.8 cu128 wheel
    (was 0.1.7) and nvidia-nccl-cu12 2.27.3 (was 2.26.2.post1).
  * sgl-kernel/CMakeLists.txt: introduce DeepGEMM_REPO / DeepGEMM_TAG and pass
    them to FetchContent_Declare(repo-deepgemm). When CUDA_VERSION compares
    VERSION_EQUAL to "12.8" the sgl-project/DeepGEMM repository at ref
    "blackwell" is fetched; every other version keeps deepseek-ai/DeepGEMM at
    the previously hard-coded commit.
  * sgl-kernel/pyproject*.toml and python/sgl_kernel/version.py: version
    string 0.1.7 -> 0.1.8.

NOTE(review): the CUDA check is an exact match on 12.8, so any other CUDA
release takes the else() branch -- confirm that is intended.
NOTE(review): "blackwell" is not a commit hash, unlike the ref used in the
else() branch -- confirm whether it should be pinned.

diff --git a/docker/Dockerfile.blackwell b/docker/Dockerfile.blackwell
index fefbde590..f65bd69f3 100644
--- a/docker/Dockerfile.blackwell
+++ b/docker/Dockerfile.blackwell
@@ -20,13 +20,13 @@ RUN echo 'tzdata tzdata/Areas select America' | debconf-set-selections \
 
 RUN pip3 install torch==2.7.1 torchvision==0.22.1 torchaudio==2.7.1 --index-url https://download.pytorch.org/whl/cu128 --break-system-packages
 
-RUN pip3 install https://github.com/sgl-project/whl/releases/download/v0.1.7/sgl_kernel-0.1.7+cu128-cp39-abi3-manylinux2014_x86_64.whl --break-system-packages \
+RUN pip3 install https://github.com/sgl-project/whl/releases/download/v0.1.8/sgl_kernel-0.1.8+cu128-cp39-abi3-manylinux2014_x86_64.whl --break-system-packages \
     && pip3 install setuptools==75.0.0 wheel scikit-build-core --break-system-packages
 
 RUN git clone --depth=1 https://github.com/sgl-project/sglang.git \
     && cd sglang && pip3 install -e "python[blackwell]" --break-system-packages
 
-RUN pip3 install nvidia-nccl-cu12==2.26.2.post1 --force-reinstall --no-deps --break-system-packages
+RUN pip3 install nvidia-nccl-cu12==2.27.3 --force-reinstall --no-deps --break-system-packages
 
 RUN pip3 install flashinfer_python==0.2.6.post1 --break-system-packages
 
diff --git a/sgl-kernel/CMakeLists.txt b/sgl-kernel/CMakeLists.txt
index 0e3daa3a4..4714ce4c8 100644
--- a/sgl-kernel/CMakeLists.txt
+++ b/sgl-kernel/CMakeLists.txt
@@ -39,6 +39,14 @@ find_package(Torch REQUIRED)
 # clean Torch Flag
 clear_cuda_arches(CMAKE_FLAG)
 
+if("${CUDA_VERSION}" VERSION_EQUAL "12.8")
+    set(DeepGEMM_REPO "https://github.com/sgl-project/DeepGEMM")
+    set(DeepGEMM_TAG "blackwell")
+else()
+    set(DeepGEMM_REPO "https://github.com/deepseek-ai/DeepGEMM")
+    set(DeepGEMM_TAG "8dfa3298274bfe6b242f6f8a3e6f3eff2707dd9f")
+endif()
+
 include(FetchContent)
 
 # cutlass
@@ -52,8 +60,8 @@ FetchContent_Populate(repo-cutlass)
 # DeepGEMM
 FetchContent_Declare(
     repo-deepgemm
-    GIT_REPOSITORY https://github.com/deepseek-ai/DeepGEMM
-    GIT_TAG        8dfa3298274bfe6b242f6f8a3e6f3eff2707dd9f
+    GIT_REPOSITORY ${DeepGEMM_REPO}
+    GIT_TAG        ${DeepGEMM_TAG}
     GIT_SHALLOW    OFF
 )
 FetchContent_Populate(repo-deepgemm)
diff --git a/sgl-kernel/pyproject.toml b/sgl-kernel/pyproject.toml
index ef059207c..f70807b65 100644
--- a/sgl-kernel/pyproject.toml
+++ b/sgl-kernel/pyproject.toml
@@ -8,7 +8,7 @@ build-backend = "scikit_build_core.build"
 
 [project]
 name = "sgl-kernel"
-version = "0.1.7"
+version = "0.1.8"
 description = "Kernel Library for SGLang"
 readme = "README.md"
 requires-python = ">=3.9"
diff --git a/sgl-kernel/pyproject_cpu.toml b/sgl-kernel/pyproject_cpu.toml
index a4482caee..522a739c0 100644
--- a/sgl-kernel/pyproject_cpu.toml
+++ b/sgl-kernel/pyproject_cpu.toml
@@ -8,7 +8,7 @@ build-backend = "scikit_build_core.build"
 
 [project]
 name = "sgl-kernel"
-version = "0.1.7"
+version = "0.1.8"
 description = "Kernel Library for SGLang"
 readme = "README.md"
 requires-python = ">=3.9"
diff --git a/sgl-kernel/pyproject_rocm.toml b/sgl-kernel/pyproject_rocm.toml
index 34abf9f92..043e26585 100644
--- a/sgl-kernel/pyproject_rocm.toml
+++ b/sgl-kernel/pyproject_rocm.toml
@@ -9,7 +9,7 @@ build-backend = "setuptools.build_meta"
 
 [project]
 name = "sgl-kernel"
-version = "0.1.7"
+version = "0.1.8"
 description = "Kernel Library for SGLang"
 readme = "README.md"
 requires-python = ">=3.9"
diff --git a/sgl-kernel/python/sgl_kernel/version.py b/sgl-kernel/python/sgl_kernel/version.py
index f1380eede..9cb17e797 100644
--- a/sgl-kernel/python/sgl_kernel/version.py
+++ b/sgl-kernel/python/sgl_kernel/version.py
@@ -1 +1 @@
-__version__ = "0.1.7"
+__version__ = "0.1.8"