chore(gb200): update dockerfile to handle fp4 disaggregation (#8694)
This commit is contained in:
@@ -53,12 +53,10 @@ RUN mkdir -p /tmp/gdrcopy && cd /tmp \
|
|||||||
RUN ln -sf /usr/lib/$(uname -m)-linux-gnu/libmlx5.so.1 /usr/lib/$(uname -m)-linux-gnu/libmlx5.so
|
RUN ln -sf /usr/lib/$(uname -m)-linux-gnu/libmlx5.so.1 /usr/lib/$(uname -m)-linux-gnu/libmlx5.so
|
||||||
|
|
||||||
# Clone and install SGLang
|
# Clone and install SGLang
|
||||||
# NOTE: flashinfer v0.2.9rc1 is not installing for aarch64
|
|
||||||
WORKDIR /sgl-workspace
|
WORKDIR /sgl-workspace
|
||||||
RUN python3 -m pip install --no-cache-dir --upgrade pip setuptools wheel html5lib six \
|
RUN python3 -m pip install --no-cache-dir --upgrade pip setuptools wheel html5lib six \
|
||||||
&& git clone https://github.com/sgl-project/sglang.git \
|
&& git clone --depth 1 https://github.com/sgl-project/sglang.git \
|
||||||
&& cd sglang \
|
&& cd sglang \
|
||||||
&& git checkout a167fd0bcb9ef4b0f4331a109e40c8cdc770b026 \
|
|
||||||
&& case "$CUDA_VERSION" in \
|
&& case "$CUDA_VERSION" in \
|
||||||
12.6.1) CUINDEX=126 ;; \
|
12.6.1) CUINDEX=126 ;; \
|
||||||
12.8.1) CUINDEX=128 ;; \
|
12.8.1) CUINDEX=128 ;; \
|
||||||
@@ -93,7 +91,7 @@ RUN wget https://developer.download.nvidia.com/compute/redist/nvshmem/3.3.9/sour
|
|||||||
# Python tools
|
# Python tools
|
||||||
RUN python3 -m pip install --no-cache-dir \
|
RUN python3 -m pip install --no-cache-dir \
|
||||||
datamodel_code_generator \
|
datamodel_code_generator \
|
||||||
mooncake_transfer_engine==0.3.5 \
|
mooncake-transfer-engine==0.3.5 \
|
||||||
pre-commit \
|
pre-commit \
|
||||||
pytest \
|
pytest \
|
||||||
black \
|
black \
|
||||||
@@ -103,6 +101,15 @@ RUN python3 -m pip install --no-cache-dir \
|
|||||||
wheel \
|
wheel \
|
||||||
scikit-build-core
|
scikit-build-core
|
||||||
|
|
||||||
|
# These will be automatically installed by future versions of flashinfer after 0.2.9rc2
|
||||||
|
RUN python3 -m pip install --no-cache-dir \
|
||||||
|
nvidia-cudnn-cu12 \
|
||||||
|
nvidia-cudnn-frontend
|
||||||
|
|
||||||
|
# Allows for FP4 disaggregation
|
||||||
|
RUN python3 -m pip install --no-cache-dir \
|
||||||
|
nixl
|
||||||
|
|
||||||
# Install development tools and utilities
|
# Install development tools and utilities
|
||||||
RUN apt-get update && apt-get install -y \
|
RUN apt-get update && apt-get install -y \
|
||||||
gdb \
|
gdb \
|
||||||
|
|||||||
Reference in New Issue
Block a user