[Test] Remove VLLM_USE_V1 in accuracy test (#1739)

### What this PR does / why we need it?
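Remove `VLLM_USE_V1` from the accuracy test: drop the `vllm_use_version` matrix entry and the `VLLM_USE_V1` environment variable from the workflow, and remove the `--vllm_use_v1` argument and the "vLLM Engine" line from the report generation script.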

Signed-off-by: hfadzxy <starmoon_zhang@163.com>
This commit is contained in:
zhangxinyuehfad
2025-07-11 15:29:11 +08:00
committed by GitHub
parent ee40d3d850
commit 1cd27da5fb
2 changed files with 4 additions and 9 deletions

View File

@@ -90,7 +90,6 @@ jobs:
}} }}
strategy: strategy:
matrix: matrix:
vllm_use_version: [1]
# the accuracy test will run: # the accuracy test will run:
# 1. workflow_dispatch with models input # 1. workflow_dispatch with models input
# - all: Qwen/Qwen3-30B-A3B, Qwen/Qwen2.5-VL-7B-Instruct, Qwen/Qwen3-8B-Base # - all: Qwen/Qwen3-30B-A3B, Qwen/Qwen2.5-VL-7B-Instruct, Qwen/Qwen3-8B-Base
@@ -122,7 +121,7 @@ jobs:
) }} ) }}
fail-fast: false fail-fast: false
name: ${{ matrix.model_name }} accuracy V${{ matrix.vllm_use_version }} name: ${{ matrix.model_name }} accuracy
container: container:
image: m.daocloud.io/quay.io/ascend/cann:8.1.rc1-910b-ubuntu22.04-py3.10 image: m.daocloud.io/quay.io/ascend/cann:8.1.rc1-910b-ubuntu22.04-py3.10
env: env:
@@ -236,15 +235,14 @@ jobs:
echo "vLLM: ${{ env.GHA_VLLM_VERSION }}" echo "vLLM: ${{ env.GHA_VLLM_VERSION }}"
echo "vLLM Ascend: ${{ env.GHA_VLLM_ASCEND_VERSION }}" echo "vLLM Ascend: ${{ env.GHA_VLLM_ASCEND_VERSION }}"
- name: Run Accuracy Test for V${{ matrix.vllm_use_version }} - name: Run Accuracy Test
id: report id: report
working-directory: ./benchmarks working-directory: ./benchmarks
env: env:
PYTORCH_NPU_ALLOC_CONF: max_split_size_mb:256 PYTORCH_NPU_ALLOC_CONF: max_split_size_mb:256
VLLM_USE_V1: ${{ matrix.vllm_use_version }}
run: | run: |
model_base_name=$(basename ${{ matrix.model_name }}) model_base_name=$(basename ${{ matrix.model_name }})
markdown_name="${model_base_name}-V${{ matrix.vllm_use_version }}" markdown_name="${model_base_name}"
echo "markdown_name=$markdown_name" echo "markdown_name=$markdown_name"
echo "markdown_name=$markdown_name" >> $GITHUB_OUTPUT echo "markdown_name=$markdown_name" >> $GITHUB_OUTPUT
mkdir -p ./accuracy mkdir -p ./accuracy
@@ -259,7 +257,6 @@ jobs:
--vllm_version "${{ env.GHA_VLLM_VERSION }}" \ --vllm_version "${{ env.GHA_VLLM_VERSION }}" \
--vllm_commit "${{ env.VLLM_COMMIT }}" \ --vllm_commit "${{ env.VLLM_COMMIT }}" \
--vllm_ascend_commit "${{ env.VLLM_ASCEND_COMMIT }}" \ --vllm_ascend_commit "${{ env.VLLM_ASCEND_COMMIT }}" \
--vllm_use_v1 "$VLLM_USE_V1"
- name: Generate step summary - name: Generate step summary
if: ${{ always() }} if: ${{ always() }}
@@ -282,7 +279,7 @@ jobs:
echo "contains_fail=false" >> $GITHUB_OUTPUT echo "contains_fail=false" >> $GITHUB_OUTPUT
fi fi
- name: Upload Report for V${{ matrix.vllm_use_version }} - name: Upload Report
if: ${{ github.event_name == 'workflow_dispatch' && steps.check_report.outputs.contains_fail == 'false' }} if: ${{ github.event_name == 'workflow_dispatch' && steps.check_report.outputs.contains_fail == 'false' }}
uses: actions/upload-artifact@v4 uses: actions/upload-artifact@v4
with: with:

View File

@@ -168,7 +168,6 @@ def generate_md(model_name, tasks_list, args, datasets):
**Software Environment**: CANN: {args.cann_version}, PyTorch: {args.torch_version}, torch-npu: {args.torch_npu_version} **Software Environment**: CANN: {args.cann_version}, PyTorch: {args.torch_version}, torch-npu: {args.torch_npu_version}
**Hardware Environment**: Atlas A2 Series **Hardware Environment**: Atlas A2 Series
**Datasets**: {datasets} **Datasets**: {datasets}
**vLLM Engine**: V{args.vllm_use_v1}
**Parallel Mode**: {PARALLEL_MODE[model_name]} **Parallel Mode**: {PARALLEL_MODE[model_name]}
**Execution Mode**: {EXECUTION_MODE[model_name]} **Execution Mode**: {EXECUTION_MODE[model_name]}
**Command**: **Command**:
@@ -310,6 +309,5 @@ if __name__ == "__main__":
parser.add_argument("--cann_version", type=str, required=False) parser.add_argument("--cann_version", type=str, required=False)
parser.add_argument("--vllm_commit", type=str, required=False) parser.add_argument("--vllm_commit", type=str, required=False)
parser.add_argument("--vllm_ascend_commit", type=str, required=False) parser.add_argument("--vllm_ascend_commit", type=str, required=False)
parser.add_argument("--vllm_use_v1", type=str, required=False)
args = parser.parse_args() args = parser.parse_args()
main(args) main(args)