Bump vLLM version to v0.10.2 (#2914)

### What this PR does / why we need it?
Bump vLLM version to v0.10.2

### Does this PR introduce _any_ user-facing change?
No

### How was this patch tested?
CI passed

- vLLM version: v0.10.2rc3
- vLLM main: 15b8fef453

Signed-off-by: Yikun Jiang <yikunkero@gmail.com>
2025-09-14 06:57:59 +08:00
parent f97a64ba7f
commit 0747a6e68c
13 changed files with 16 additions and 16 deletions
--- a/.github/workflows/accuracy_test.yaml
+++ b/.github/workflows/accuracy_test.yaml
@@ -112,7 +112,7 @@ jobs:
        uses: actions/checkout@v4
        with:
          repository: vllm-project/vllm
-          ref: v0.10.2rc3
+          ref: v0.10.2
          path: ./vllm-empty
      - name: Install vllm-project/vllm from source
--- a/.github/workflows/nightly_benchmarks.yaml
+++ b/.github/workflows/nightly_benchmarks.yaml
@@ -51,7 +51,7 @@ jobs:
    strategy:
      matrix:
        include:
-          - vllm_branch: v0.10.2rc3
+          - vllm_branch: v0.10.2
            vllm_ascend_branch: main
            vllm_use_v1: 1
      max-parallel: 1
--- a/.github/workflows/vllm_ascend_dist.yaml
+++ b/.github/workflows/vllm_ascend_dist.yaml
@@ -43,7 +43,7 @@ jobs:
    strategy:
      matrix:
        os: [linux-aarch64-a3-8]
-        vllm_version: [v0.10.2rc3]
+        vllm_version: [v0.10.2]
    name: vLLM Ascend test
    runs-on: ${{ matrix.os }}
    container:
--- a/.github/workflows/vllm_ascend_test.yaml
+++ b/.github/workflows/vllm_ascend_test.yaml
@@ -82,7 +82,7 @@ jobs:
        VLLM_USE_MODELSCOPE: True
    strategy:
      matrix:
-        vllm_version: [v0.10.2rc3]
+        vllm_version: [v0.10.2]
    steps:
      - name: Install packages
        run: |
@@ -138,7 +138,7 @@ jobs:
      max-parallel: 2
      matrix:
        os: [linux-aarch64-a2-1]
-        vllm_version: [v0.10.2rc3]
+        vllm_version: [v0.10.2]
    name: singlecard e2e test - light
    runs-on: ${{ matrix.os }}
    container:
@@ -203,7 +203,7 @@ jobs:
      max-parallel: 2
      matrix:
        os: [linux-aarch64-a2-2]
-        vllm_version: [v0.10.2rc3]
+        vllm_version: [v0.10.2]
    name: multicard e2e test - light
    runs-on: ${{ matrix.os }}
    container:
--- a/.github/workflows/vllm_ascend_test_310p.yaml
+++ b/.github/workflows/vllm_ascend_test_310p.yaml
@@ -53,7 +53,7 @@ jobs:
      max-parallel: 2
      matrix:
        os: [linux-aarch64-310p-1, linux-aarch64-310p-4]
-        vllm_version: [v0.10.2rc3]
+        vllm_version: [v0.10.2]
    name: 310p e2e test
    runs-on: ${{ matrix.os }}
    container:
--- a/.github/workflows/vllm_ascend_test_full.yaml
+++ b/.github/workflows/vllm_ascend_test_full.yaml
@@ -72,7 +72,7 @@ jobs:
      max-parallel: 2
      matrix:
        os: [linux-aarch64-a2-1]
-        vllm_version: [v0.10.2rc3]
+        vllm_version: [v0.10.2]
    name: singlecard e2e test - full
    runs-on: ${{ matrix.os }}
    container:
@@ -156,7 +156,7 @@ jobs:
      max-parallel: 2
      matrix:
        os: [linux-aarch64-a2-2]
-        vllm_version: [v0.10.2rc3]
+        vllm_version: [v0.10.2]
    name: multicard e2e test - full
    runs-on: ${{ matrix.os }}
    container:
--- a/Dockerfile
+++ b/Dockerfile
@@ -37,7 +37,7 @@ RUN pip config set global.index-url ${PIP_INDEX_URL}
 # Install vLLM
 ARG VLLM_REPO=https://github.com/vllm-project/vllm.git
-ARG VLLM_TAG=v0.10.2rc3
+ARG VLLM_TAG=v0.10.2
 RUN git clone --depth 1 $VLLM_REPO --branch $VLLM_TAG /vllm-workspace/vllm
 # In x86, triton will be installed by vllm. But in Ascend, triton doesn't work correctly. we need to uninstall it.
 RUN VLLM_TARGET_DEVICE="empty" python3 -m pip install -v -e /vllm-workspace/vllm/ --extra-index https://download.pytorch.org/whl/cpu/ && \
--- a/Dockerfile.310p
+++ b/Dockerfile.310p
@@ -37,7 +37,7 @@ RUN pip config set global.index-url ${PIP_INDEX_URL}
 # Install vLLM
 ARG VLLM_REPO=https://github.com/vllm-project/vllm.git
-ARG VLLM_TAG=v0.10.2rc3
+ARG VLLM_TAG=v0.10.2
 RUN git clone --depth 1 $VLLM_REPO --branch $VLLM_TAG /vllm-workspace/vllm
 # In x86, triton will be installed by vllm. But in Ascend, triton doesn't work correctly. we need to uninstall it.
 RUN VLLM_TARGET_DEVICE="empty" python3 -m pip install -v -e /vllm-workspace/vllm/ --extra-index https://download.pytorch.org/whl/cpu/ && \
--- a/Dockerfile.310p.openEuler
+++ b/Dockerfile.310p.openEuler
@@ -34,7 +34,7 @@ COPY . /vllm-workspace/vllm-ascend/
 # Install vLLM
 ARG VLLM_REPO=https://github.com/vllm-project/vllm.git
-ARG VLLM_TAG=v0.10.2rc3
+ARG VLLM_TAG=v0.10.2
 RUN git clone --depth 1 $VLLM_REPO --branch $VLLM_TAG /vllm-workspace/vllm
 # In x86, triton will be installed by vllm. But in Ascend, triton doesn't work correctly. we need to uninstall it.
--- a/Dockerfile.a3
+++ b/Dockerfile.a3
@@ -37,7 +37,7 @@ RUN pip config set global.index-url ${PIP_INDEX_URL}
 # Install vLLM
 ARG VLLM_REPO=https://github.com/vllm-project/vllm.git
-ARG VLLM_TAG=v0.10.2rc3
+ARG VLLM_TAG=v0.10.2
 RUN git clone --depth 1 $VLLM_REPO --branch $VLLM_TAG /vllm-workspace/vllm
 # In x86, triton will be installed by vllm. But in Ascend, triton doesn't work correctly. we need to uninstall it.
 RUN VLLM_TARGET_DEVICE="empty" python3 -m pip install -v -e /vllm-workspace/vllm/ --extra-index https://download.pytorch.org/whl/cpu/ && \
--- a/Dockerfile.a3.openEuler
+++ b/Dockerfile.a3.openEuler
@@ -34,7 +34,7 @@ COPY . /vllm-workspace/vllm-ascend/
 # Install vLLM
 ARG VLLM_REPO=https://github.com/vllm-project/vllm.git
-ARG VLLM_TAG=v0.10.2rc3
+ARG VLLM_TAG=v0.10.2
 RUN git clone --depth 1 $VLLM_REPO --branch $VLLM_TAG /vllm-workspace/vllm
 # In x86, triton will be installed by vllm. But in Ascend, triton doesn't work correctly. we need to uninstall it.
--- a/Dockerfile.openEuler
+++ b/Dockerfile.openEuler
@@ -34,7 +34,7 @@ COPY . /vllm-workspace/vllm-ascend/
 # Install vLLM
 ARG VLLM_REPO=https://github.com/vllm-project/vllm.git
-ARG VLLM_TAG=v0.10.2rc3
+ARG VLLM_TAG=v0.10.2
 RUN git clone --depth 1 $VLLM_REPO --branch $VLLM_TAG /vllm-workspace/vllm
 # In x86, triton will be installed by vllm. But in Ascend, triton doesn't work correctly. we need to uninstall it.
--- a/docs/source/conf.py
+++ b/docs/source/conf.py
@@ -77,7 +77,7 @@ myst_substitutions = {
    # CANN image tag
    'cann_image_tag': "8.2.rc1-910b-ubuntu22.04-py3.11",
    # vllm version in ci
-    'ci_vllm_version': 'v0.10.2rc3',
+    'ci_vllm_version': 'v0.10.2',
 }
 # Add any paths that contain templates here, relative to this directory.