From b6e0cfb5e1c355f9526defdf9bbee430c0bfebaa Mon Sep 17 00:00:00 2001 From: kk <43161300+kkHuang-amd@users.noreply.github.com> Date: Wed, 1 Jan 2025 12:12:19 +0800 Subject: [PATCH] ROCm base image update (#2692) Co-authored-by: wunhuang --- docker/Dockerfile.rocm | 8 +++++++- python/pyproject.toml | 2 +- 2 files changed, 8 insertions(+), 2 deletions(-) diff --git a/docker/Dockerfile.rocm b/docker/Dockerfile.rocm index c416a4b1b..84ea69cc0 100644 --- a/docker/Dockerfile.rocm +++ b/docker/Dockerfile.rocm @@ -2,7 +2,7 @@ # docker build --build-arg SGL_BRANCH=v0.4.1.post3 -t v0.4.1.post3-rocm620 -f Dockerfile.rocm . # default base image -ARG BASE_IMAGE="rocm/vllm-dev:20241022" +ARG BASE_IMAGE="rocm/vllm-dev:20241031-tuned" FROM $BASE_IMAGE AS base USER root @@ -33,6 +33,12 @@ RUN git clone ${SGL_REPO} \ RUN cp -r /sgl-workspace/sglang /sglang RUN python -m pip cache purge +RUN pip install IPython \ + && pip install orjson \ + && pip install python-multipart \ + && pip install torchao \ + && pip install pybind11 + RUN pip uninstall -y triton RUN git clone ${TRITON_REPO} \ && cd triton \ diff --git a/python/pyproject.toml b/python/pyproject.toml index c51e21f50..b59f334e6 100644 --- a/python/pyproject.toml +++ b/python/pyproject.toml @@ -27,7 +27,7 @@ srt = ["sglang[runtime_common]", "torch", "vllm>=0.6.3.post1,<=0.6.4.post1", "cu # HIP (Heterogeneous-computing Interface for Portability) for AMD # => base docker rocm/vllm-dev:20241022, not from public vllm whl -srt_hip = ["sglang[runtime_common]", "torch", "vllm==0.6.3.dev13"] +srt_hip = ["sglang[runtime_common]", "torch", "vllm==0.6.3.post2.dev1"] # xpu is not enabled in public vllm and torch whl, # need to follow https://docs.vllm.ai/en/latest/getting_started/xpu-installation.htmlinstall vllm srt_xpu = ["sglang[runtime_common]"]