chore: update Dockerfile (#8872)
Co-authored-by: zhyncs <me@zhyncs.com>
This commit is contained in:
@@ -14,7 +14,7 @@ ENV PATH="${PATH}:/usr/local/nvidia/bin" \
|
|||||||
|
|
||||||
RUN apt update && apt install wget -y && apt install software-properties-common -y \
|
RUN apt update && apt install wget -y && apt install software-properties-common -y \
|
||||||
&& add-apt-repository ppa:deadsnakes/ppa -y \
|
&& add-apt-repository ppa:deadsnakes/ppa -y \
|
||||||
&& apt install python3.12-full -y \
|
&& apt install python3.12-full python3.12-dev python3.10-venv -y \
|
||||||
&& update-alternatives --install /usr/bin/python3 python3 /usr/bin/python3.10 1 \
|
&& update-alternatives --install /usr/bin/python3 python3 /usr/bin/python3.10 1 \
|
||||||
&& update-alternatives --install /usr/bin/python3 python3 /usr/bin/python3.12 2 \
|
&& update-alternatives --install /usr/bin/python3 python3 /usr/bin/python3.12 2 \
|
||||||
&& update-alternatives --set python3 /usr/bin/python3.12 \
|
&& update-alternatives --set python3 /usr/bin/python3.12 \
|
||||||
@@ -28,7 +28,6 @@ RUN echo 'tzdata tzdata/Areas select America' | debconf-set-selections \
|
|||||||
tzdata \
|
tzdata \
|
||||||
software-properties-common netcat-openbsd kmod unzip openssh-server \
|
software-properties-common netcat-openbsd kmod unzip openssh-server \
|
||||||
curl wget lsof zsh ccache tmux htop git-lfs tree \
|
curl wget lsof zsh ccache tmux htop git-lfs tree \
|
||||||
python3 python3-pip python3-dev libpython3-dev python3-venv \
|
|
||||||
build-essential cmake \
|
build-essential cmake \
|
||||||
libopenmpi-dev libnuma1 libnuma-dev \
|
libopenmpi-dev libnuma1 libnuma-dev \
|
||||||
libibverbs-dev libibverbs1 libibumad3 \
|
libibverbs-dev libibverbs1 libibumad3 \
|
||||||
@@ -44,7 +43,7 @@ RUN echo 'tzdata tzdata/Areas select America' | debconf-set-selections \
|
|||||||
patchelf \
|
patchelf \
|
||||||
nvidia-dkms-550 \
|
nvidia-dkms-550 \
|
||||||
devscripts debhelper fakeroot dkms check libsubunit0 libsubunit-dev \
|
devscripts debhelper fakeroot dkms check libsubunit0 libsubunit-dev \
|
||||||
&& ln -sf /usr/bin/python3 /usr/bin/python \
|
&& ln -sf /usr/bin/python3.12 /usr/bin/python \
|
||||||
&& rm -rf /var/lib/apt/lists/* \
|
&& rm -rf /var/lib/apt/lists/* \
|
||||||
&& apt-get clean
|
&& apt-get clean
|
||||||
|
|
||||||
@@ -67,12 +66,16 @@ RUN python3 -m pip install --no-cache-dir --upgrade pip setuptools wheel html5li
|
|||||||
&& case "$CUDA_VERSION" in \
|
&& case "$CUDA_VERSION" in \
|
||||||
12.6.1) CUINDEX=126 ;; \
|
12.6.1) CUINDEX=126 ;; \
|
||||||
12.8.1) CUINDEX=128 ;; \
|
12.8.1) CUINDEX=128 ;; \
|
||||||
|
12.9.1) CUINDEX=129 ;; \
|
||||||
*) echo "Unsupported CUDA version: $CUDA_VERSION" && exit 1 ;; \
|
*) echo "Unsupported CUDA version: $CUDA_VERSION" && exit 1 ;; \
|
||||||
esac \
|
esac \
|
||||||
&& python3 -m pip install --no-cache-dir -e "python[${BUILD_TYPE}]" --extra-index-url https://download.pytorch.org/whl/cu${CUINDEX} \
|
&& python3 -m pip install --no-cache-dir -e "python[${BUILD_TYPE}]" --extra-index-url https://download.pytorch.org/whl/test/cu${CUINDEX} \
|
||||||
&& python3 -m pip install --no-cache-dir nvidia-nccl-cu12==2.27.6 --force-reinstall --no-deps \
|
&& python3 -m pip install --no-cache-dir nvidia-nccl-cu12==2.27.6 --force-reinstall --no-deps \
|
||||||
&& if [ "$CUDA_VERSION" = "12.8.1" ]; then \
|
&& if [ "$CUDA_VERSION" = "12.8.1" ]; then \
|
||||||
python3 -m pip install --no-cache-dir https://github.com/sgl-project/whl/releases/download/v0.2.9/sgl_kernel-0.2.9+cu128-cp39-abi3-manylinux2014_x86_64.whl --force-reinstall --no-deps ; \
|
python3 -m pip install --no-cache-dir https://github.com/sgl-project/whl/releases/download/v0.3.2/sgl_kernel-0.3.2+cu128-cp39-abi3-manylinux2014_x86_64.whl --force-reinstall --no-deps ; \
|
||||||
|
fi \
|
||||||
|
&& if [ "$CUDA_VERSION" = "12.9.1" ]; then \
|
||||||
|
python3 -m pip install --no-cache-dir https://github.com/sgl-project/whl/releases/download/v0.3.2/sgl_kernel-0.3.2-cp39-abi3-manylinux2014_x86_64.whl --force-reinstall --no-deps ; \
|
||||||
fi
|
fi
|
||||||
|
|
||||||
# Build and install NVSHMEM + DeepEP
|
# Build and install NVSHMEM + DeepEP
|
||||||
|
|||||||
Reference in New Issue
Block a user