diff --git a/docker/Dockerfile.blackwell b/docker/Dockerfile.blackwell
new file mode 100644
index 000000000..a261706f7
--- /dev/null
+++ b/docker/Dockerfile.blackwell
@@ -0,0 +1,31 @@
+# Builds an SGLang image with the `blackwell` extra on top of the CUDA 12.8
+# PyTorch manylinux builder image.
+
+# NOTE(review): CUDA_VERSION is declared before FROM but is not referenced by
+# any instruction in this file; kept so callers passing --build-arg still work.
+ARG CUDA_VERSION=12.8.1
+
+FROM pytorch/manylinux2_28-builder:cuda12.8
+
+# NOTE(review): BUILD_TYPE is likewise not referenced below; kept for
+# compatibility with existing build invocations.
+ARG BUILD_TYPE=all
+ENV DEBIAN_FRONTEND=noninteractive
+
+WORKDIR /sgl-workspace
+
+# Pre-release PyTorch wheels from the nightly cu128 index.
+RUN pip3 install --no-cache-dir --pre torch torchvision torchaudio --index-url https://download.pytorch.org/whl/nightly/cu128
+
+# Pinned NCCL, the prebuilt cu128 sgl-kernel wheel, and packaging tooling.
+RUN pip3 install --no-cache-dir nvidia-nccl-cu12==2.26.2.post1 \
+    && pip3 install --no-cache-dir https://github.com/sgl-project/whl/releases/download/v0.0.8.post1/sgl_kernel-0.0.8.post1+cu128-cp39-abi3-manylinux2014_x86_64.whl \
+    && pip3 install --no-cache-dir setuptools==75.0.0 wheel==0.41.0 scikit-build-core
+
+# The clone lands in ./sglang (relative to WORKDIR), so the editable install
+# must point at sglang/python; a bare "python[blackwell]" path does not exist.
+RUN git clone --depth=1 https://github.com/sgl-project/sglang.git \
+    && pip3 install --no-cache-dir -e "sglang/python[blackwell]"
+
+# Replace the noninteractive setting used during the build for the final image.
+ENV DEBIAN_FRONTEND=interactive
diff --git a/python/pyproject.toml b/python/pyproject.toml
index 11ee0ed1b..cbeb42163 100644
--- a/python/pyproject.toml
+++ b/python/pyproject.toml
@@ -57,6 +57,17 @@ srt = [
     "einops",
 ]
 
+blackwell = [
+    "sglang[runtime_common]",
+    "sgl-kernel",
+    "torch",
+    "torchvision",
+    "cuda-python",
+    "outlines>=0.0.44,<=0.1.11",
+    "partial_json_parser",
+    "einops",
+]
+
 # HIP (Heterogeneous-computing Interface for Portability) for AMD
 # => base docker rocm/vllm-dev:20250114, not from public vllm whl
 srt_hip = [