[Test] Add accuracy nightly test for new models (#4262)

### What this PR does / why we need it?
Add nightly accuracy tests for the following new models:

- PaddlePaddle/ERNIE-4.5-21B-A3B-PT
- LLM-Research/Molmo-7B-D-0924
- LLM-Research/gemma-2-9b-it
- LLM-Research/gemma-3-4b-it
- Shanghai_AI_Laboratory/internlm-7b
- llava-hf/llava-1.5-7b-hf

- vLLM version: v0.11.2

Signed-off-by: hfadzxy <starmoon_zhang@163.com>
This commit is contained in:
zhangxinyuehfad
2025-12-01 22:28:46 +08:00
committed by GitHub
parent 8e7f5cff6d
commit b6afec73e1
11 changed files with 97 additions and 4 deletions

View File

@@ -59,7 +59,7 @@ jobs:
name: ${{inputs.model_list}} accuracy test
runs-on: ${{ inputs.runner }}
container:
image: swr.cn-southwest-2.myhuaweicloud.com/base_image/ascend-ci/cann:8.3.rc2-910b-ubuntu22.04-py3.11
image: "${{ inputs.image }}"
env:
VLLM_USE_MODELSCOPE: True
GHA_VLLM_ASCEND_VERSION: ${{ inputs.vllm-ascend }}
@@ -111,6 +111,12 @@ jobs:
. /usr/local/Ascend/ascend-toolkit/8.3.RC2/bisheng_toolkit/set_env.sh
python3 -m pip install "https://vllm-ascend.obs.cn-north-4.myhuaweicloud.com/vllm-ascend/triton_ascend-3.2.0.dev2025110717-cp311-cp311-manylinux_2_27_aarch64.whl"
- name: Install tensorflow (for Molmo-7B-D-0924)
if: ${{ inputs.runner == 'linux-aarch64-a2-1' && contains(inputs.model_list, 'Molmo-7B-D-0924') }}
shell: bash -l {0}
run: |
pip install tensorflow --no-cache-dir
- name: Resolve vllm-ascend version
run: |
VERSION_INPUT="${{ inputs.vllm-ascend }}"
@@ -172,6 +178,7 @@ jobs:
id: report
env:
VLLM_WORKER_MULTIPROC_METHOD: spawn
HF_DATASETS_OFFLINE: True
VLLM_USE_MODELSCOPE: True
VLLM_CI_RUNNER: ${{ inputs.runner }}
VLLM_VERSION: ${{ env.GHA_VLLM_VERSION }}

View File

@@ -114,6 +114,15 @@ jobs:
- Qwen3-VL-8B-Instruct
- Qwen2.5-Omni-7B
- Meta-Llama-3.1-8B-Instruct
- os: linux-aarch64-a2-1
model_list:
- ERNIE-4.5-21B-A3B-PT
- gemma-2-9b-it
- gemma-3-4b-it
- internlm-7b
- InternVL3_5-8B-hf
- llava-1.5-7b-hf
- Molmo-7B-D-0924
- os: linux-aarch64-a2-2
model_list:
- Qwen3-30B-A3B
@@ -128,5 +137,5 @@ jobs:
vllm: v0.11.2
runner: ${{ matrix.test_config.os }}
model_list: ${{ toJson(matrix.test_config.model_list) }}
image: swr.cn-southwest-2.myhuaweicloud.com/base_image/ascend-ci/cann:8.2.rc1-910b-ubuntu22.04-py3.11
image: 'swr.cn-southwest-2.myhuaweicloud.com/base_image/ascend-ci/cann:8.3.rc2-910b-ubuntu22.04-py3.11'
upload: false