[Test] add a new Qwen3-32b-int8 test case with feature_stack3 (#3676)
### What this PR does / why we need it?
This PR adds a new Qwen3-32b-int8 test case to the nightly tests. The test case mainly checks the performance and accuracy of Qwen3-32b-int8 with a new feature stack (feature_stack3).
### Does this PR introduce _any_ user-facing change?
No
### How was this patch tested?
By running the test.
- vLLM version: v0.11.0rc3
- vLLM main: https://github.com/vllm-project/vllm/commit/v0.11.0
---------
Signed-off-by: root <root@hostname-2pbfv.foreman.pxe>
Co-authored-by: root <root@hostname-2pbfv.foreman.pxe>
This commit is contained in:
11
.github/workflows/vllm_ascend_test_nightly.yaml
vendored
11
.github/workflows/vllm_ascend_test_nightly.yaml
vendored
@@ -98,6 +98,17 @@ jobs:
|
||||
runner: ${{ matrix.os }}
|
||||
image: swr.cn-southwest-2.myhuaweicloud.com/base_image/ascend-ci/cann:8.2.rc1-a3-ubuntu22.04-py3.11
|
||||
tests: tests/e2e/nightly/models/test_deepseek_r1_w8a8_eplb.py
|
||||
qwen3-32b-int8-a3-feature-stack3:
|
||||
if: contains(github.event.pull_request.labels.*.name, 'run-nightly')
|
||||
strategy:
|
||||
matrix:
|
||||
os: [ linux-aarch64-a3-4 ]
|
||||
uses: ./.github/workflows/_e2e_nightly.yaml
|
||||
with:
|
||||
vllm: v0.11.0
|
||||
runner: ${{ matrix.os }}
|
||||
image: swr.cn-southwest-2.myhuaweicloud.com/base_image/ascend-ci/cann:8.2.rc1-a3-ubuntu22.04-py3.11
|
||||
tests: tests/e2e/nightly/features/test_qwen3_32b_int8_a3_feature_stack3.py
|
||||
qwen2-5-vl-7b:
|
||||
if: contains(github.event.pull_request.labels.*.name, 'run-nightly')
|
||||
strategy:
|
||||
|
||||
Reference in New Issue
Block a user