Upgrade vLLM version to v0.9.2 (#1652)
### What this PR does / why we need it?
This patch upgrades the vLLM version to v0.9.2. To make the review easier, it
does not yet remove the v0.9.1 compatibility code.
### Does this PR introduce _any_ user-facing change?
No
### How was this patch tested?
- vLLM version: v0.9.1
- vLLM main:
14601f5fba
- Accuracy test with 0.9.2:
https://github.com/vllm-project/vllm-ascend/actions/runs/16121612087
Signed-off-by: Yikun Jiang <yikunkero@gmail.com>
This commit is contained in:
3
.github/workflows/accuracy_test.yaml
vendored
3
.github/workflows/accuracy_test.yaml
vendored
@@ -37,6 +37,7 @@ on:
|
||||
# Current supported vLLM versions
|
||||
options:
|
||||
- main
|
||||
- v0.9.2
|
||||
- v0.9.1
|
||||
- v0.7.3
|
||||
vllm-ascend-version:
|
||||
@@ -163,7 +164,7 @@ jobs:
|
||||
repository: vllm-project/vllm
|
||||
path: ./vllm-empty
|
||||
# Please also update this when bump matched version
|
||||
ref: ${{ github.event.inputs.vllm-version || 'v0.9.1' }}
|
||||
ref: ${{ github.event.inputs.vllm-version || 'v0.9.2' }}
|
||||
|
||||
- name: Install vllm-project/vllm from source
|
||||
working-directory: ./vllm-empty
|
||||
|
||||
2
.github/workflows/nightly_benchmarks.yaml
vendored
2
.github/workflows/nightly_benchmarks.yaml
vendored
@@ -50,7 +50,7 @@ jobs:
|
||||
strategy:
|
||||
matrix:
|
||||
include:
|
||||
- vllm_branch: v0.9.1
|
||||
- vllm_branch: v0.9.2
|
||||
vllm_ascend_branch: main
|
||||
vllm_use_v1: 1
|
||||
max-parallel: 1
|
||||
|
||||
8
.github/workflows/vllm_ascend_test.yaml
vendored
8
.github/workflows/vllm_ascend_test.yaml
vendored
@@ -138,13 +138,13 @@ jobs:
|
||||
if: ${{ needs.lint.result == 'success' || github.event_name == 'push' }}
|
||||
runs-on: ubuntu-latest
|
||||
container:
|
||||
image: m.daocloud.io/quay.io/ascend/cann:8.1.rc1-910b-ubuntu22.04-py3.10
|
||||
image: quay.io/ascend/cann:8.1.rc1-910b-ubuntu22.04-py3.10
|
||||
env:
|
||||
VLLM_LOGGING_LEVEL: ERROR
|
||||
VLLM_USE_MODELSCOPE: True
|
||||
strategy:
|
||||
matrix:
|
||||
vllm_version: [main, v0.9.1]
|
||||
vllm_version: [main, v0.9.2]
|
||||
steps:
|
||||
- name: Install packages
|
||||
run: |
|
||||
@@ -201,7 +201,7 @@ jobs:
|
||||
max-parallel: 2
|
||||
matrix:
|
||||
os: [linux-arm64-npu-1]
|
||||
vllm_version: [main, v0.9.1]
|
||||
vllm_version: [main, v0.9.2]
|
||||
name: singlecard e2e test
|
||||
runs-on: ${{ matrix.os }}
|
||||
container:
|
||||
@@ -302,7 +302,7 @@ jobs:
|
||||
max-parallel: 1
|
||||
matrix:
|
||||
os: [linux-arm64-npu-4]
|
||||
vllm_version: [main, v0.9.1]
|
||||
vllm_version: [main, v0.9.2]
|
||||
name: multicard e2e test
|
||||
runs-on: ${{ matrix.os }}
|
||||
container:
|
||||
|
||||
@@ -43,7 +43,7 @@ jobs:
|
||||
max-parallel: 2
|
||||
matrix:
|
||||
os: [linux-arm64-npu-1, linux-arm64-npu-4]
|
||||
vllm_version: [main, v0.9.1]
|
||||
vllm_version: [main, v0.9.2]
|
||||
name: vLLM Ascend long term test
|
||||
runs-on: ${{ matrix.os }}
|
||||
container:
|
||||
|
||||
Reference in New Issue
Block a user