[Test] Add accuracy test report workflow (#542)

### What this PR does / why we need it?

1. Provide an accuracy test report for development branch releases.
2. Models and datasets for the accuracy test:

| Model | Datasets |
|---|---|
| Qwen2.5-7B-Instruct | ceval-val, gsm8k, mmlu |
| Qwen3-8B | ceval-val, gsm8k, mmlu |
| Llama-3.1-8B-Instruct | ceval-val, gsm8k, mmlu |
| Qwen2.5-VL-7B-Instruct | mmmu_val |

### Does this PR introduce _any_ user-facing change?

This PR will display the accuracy test report of the release version in docs/source/developer_guide/accuracy_report:

- Qwen2.5-7B-Instruct.md
- Qwen3-8B.md
- Llama-3.1-8B-Instruct.md
- Qwen2.5-VL-7B-Instruct.md

Signed-off-by: hfadzxy <starmoon_zhang@163.com>
2025-04-30 14:53:58 +08:00
parent ba9714ccee
commit affca6f348
6 changed files with 587 additions and 2 deletions
--- a/.github/workflows/accuracy_report.yaml
+++ b/.github/workflows/accuracy_report.yaml
@@ -0,0 +1,150 @@
+#
+# Copyright (c) 2025 Huawei Technologies Co., Ltd. All Rights Reserved.
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#     http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+# This file is a part of the vllm-ascend project.
+#
+
+name: Accuracy Report
+# Manually dispatched workflow. Both inputs are mandatory free-form strings:
+#   branch              - branch that is checked out and named in the PR text
+#   vllm-ascend-version - version prefix of the report artifacts to collect
+on:
+  workflow_dispatch:
+    inputs:
+      branch:
+        description: 'choose a dev branch to pr'
+        required: true
+        type: string
+      vllm-ascend-version:
+        description: 'what vllm-ascend version to accuracy test?'
+        required: true
+        type: string
+jobs:
+  # Single job: resolves the newest report artifact of each model, downloads
+  # the reports into the docs tree and opens a pull request with the result.
+  download:
+    runs-on: ubuntu-latest
+    steps:
+      # Check out the branch given by the `branch` dispatch input.
+      - name: Checkout repository
+        uses: actions/checkout@v4
+        with:
+          ref: "${{ github.event.inputs.branch }}"
+
+      # Print the repository's artifact listing to the job log for debugging.
+      - name: Debug List Artifacts
+        env:
+          GH_TOKEN: ${{ secrets.GITHUB_TOKEN }}
+        run: |
+          gh api /repos/${{ github.repository }}/actions/artifacts
+
+      # Resolve the workflow run that produced the newest Qwen2.5-VL-7B-Instruct
+      # V0 report artifact and expose its id as the `runid` step output.
+      - name: Query artifact run id for Qwen2.5-VL-7B-Instruct V0 latest artifact
+        id: get_Qwen2_5_VL_7B_Instruct_latest_run_id_V0
+        env:
+          GH_TOKEN: ${{ secrets.GITHUB_TOKEN }}
+          # Handed over via the environment so the user-supplied version is
+          # never expanded into the shell script or the jq program text.
+          ARTIFACT_NAME: ${{ github.event.inputs.vllm-ascend-version }}-Qwen2.5-VL-7B-Instruct-V0-report
+        run: |
+          # Filter by name on the server: an unfiltered listing only returns
+          # the first page of artifacts and may miss the one we need.
+          ARTIFACT_JSON=$(gh api --method GET "repos/${{ github.repository }}/actions/artifacts" \
+            -f name="$ARTIFACT_NAME" -f per_page=100)
+          # Newest non-expired artifact with that exact name; prints nothing
+          # (instead of the string "null") when there is no match.
+          RUN_ID=$(echo "$ARTIFACT_JSON" | \
+            jq -r --arg name "$ARTIFACT_NAME" \
+              '[.artifacts[] | select(.name == $name and (.expired | not))] | sort_by(.created_at) | last | .workflow_run.id // empty')
+          if [ -z "$RUN_ID" ]; then
+            echo "::error::No usable artifact named '$ARTIFACT_NAME' was found"
+            exit 1
+          fi
+          echo "runid=$RUN_ID" >> "$GITHUB_OUTPUT"
+
+      # Resolve the workflow run that produced the newest Qwen2.5-7B-Instruct
+      # V0 report artifact and expose its id as the `runid` step output.
+      - name: Query artifact run id for Qwen2.5-7B-Instruct V0 latest artifact
+        id: get_Qwen2_5_7B_Instruct_latest_run_id_V0
+        env:
+          GH_TOKEN: ${{ secrets.GITHUB_TOKEN }}
+          # Handed over via the environment so the user-supplied version is
+          # never expanded into the shell script or the jq program text.
+          ARTIFACT_NAME: ${{ github.event.inputs.vllm-ascend-version }}-Qwen2.5-7B-Instruct-V0-report
+        run: |
+          # Filter by name on the server: an unfiltered listing only returns
+          # the first page of artifacts and may miss the one we need.
+          ARTIFACT_JSON=$(gh api --method GET "repos/${{ github.repository }}/actions/artifacts" \
+            -f name="$ARTIFACT_NAME" -f per_page=100)
+          # Newest non-expired artifact with that exact name; prints nothing
+          # (instead of the string "null") when there is no match.
+          RUN_ID=$(echo "$ARTIFACT_JSON" | \
+            jq -r --arg name "$ARTIFACT_NAME" \
+              '[.artifacts[] | select(.name == $name and (.expired | not))] | sort_by(.created_at) | last | .workflow_run.id // empty')
+          if [ -z "$RUN_ID" ]; then
+            echo "::error::No usable artifact named '$ARTIFACT_NAME' was found"
+            exit 1
+          fi
+          echo "runid=$RUN_ID" >> "$GITHUB_OUTPUT"
+
+      # Resolve the workflow run that produced the newest Llama-3.1-8B-Instruct
+      # V0 report artifact and expose its id as the `runid` step output.
+      - name: Query artifact run id for Llama-3.1-8B-Instruct V0 latest artifact
+        id: get_Llama_3_1_8B_Instruct_latest_run_id_V0
+        env:
+          GH_TOKEN: ${{ secrets.GITHUB_TOKEN }}
+          # Handed over via the environment so the user-supplied version is
+          # never expanded into the shell script or the jq program text.
+          ARTIFACT_NAME: ${{ github.event.inputs.vllm-ascend-version }}-Llama-3.1-8B-Instruct-V0-report
+        run: |
+          # Filter by name on the server: an unfiltered listing only returns
+          # the first page of artifacts and may miss the one we need.
+          ARTIFACT_JSON=$(gh api --method GET "repos/${{ github.repository }}/actions/artifacts" \
+            -f name="$ARTIFACT_NAME" -f per_page=100)
+          # Newest non-expired artifact with that exact name; prints nothing
+          # (instead of the string "null") when there is no match.
+          RUN_ID=$(echo "$ARTIFACT_JSON" | \
+            jq -r --arg name "$ARTIFACT_NAME" \
+              '[.artifacts[] | select(.name == $name and (.expired | not))] | sort_by(.created_at) | last | .workflow_run.id // empty')
+          if [ -z "$RUN_ID" ]; then
+            echo "::error::No usable artifact named '$ARTIFACT_NAME' was found"
+            exit 1
+          fi
+          echo "runid=$RUN_ID" >> "$GITHUB_OUTPUT"
+
+      # Resolve the workflow run that produced the newest Qwen3-8B V0 report
+      # artifact and expose its id as the `runid` step output.
+      - name: Query artifact run id for Qwen3-8B V0 latest artifact
+        id: get_Qwen3_8B_latest_run_id_V0
+        env:
+          GH_TOKEN: ${{ secrets.GITHUB_TOKEN }}
+          # Handed over via the environment so the user-supplied version is
+          # never expanded into the shell script or the jq program text.
+          ARTIFACT_NAME: ${{ github.event.inputs.vllm-ascend-version }}-Qwen3-8B-V0-report
+        run: |
+          # Filter by name on the server: an unfiltered listing only returns
+          # the first page of artifacts and may miss the one we need.
+          ARTIFACT_JSON=$(gh api --method GET "repos/${{ github.repository }}/actions/artifacts" \
+            -f name="$ARTIFACT_NAME" -f per_page=100)
+          # Newest non-expired artifact with that exact name; prints nothing
+          # (instead of the string "null") when there is no match.
+          RUN_ID=$(echo "$ARTIFACT_JSON" | \
+            jq -r --arg name "$ARTIFACT_NAME" \
+              '[.artifacts[] | select(.name == $name and (.expired | not))] | sort_by(.created_at) | last | .workflow_run.id // empty')
+          if [ -z "$RUN_ID" ]; then
+            echo "::error::No usable artifact named '$ARTIFACT_NAME' was found"
+            exit 1
+          fi
+          echo "runid=$RUN_ID" >> "$GITHUB_OUTPUT"
+
+      # Download the Qwen2.5-VL-7B-Instruct report from the run resolved by the
+      # matching query step into the accuracy report docs directory.
+      - name: Download Qwen/Qwen2.5-VL-7B-Instruct V0 Artifact
+        uses: actions/download-artifact@v4
+        with:
+          name: ${{ github.event.inputs.vllm-ascend-version }}-Qwen2.5-VL-7B-Instruct-V0-report
+          path: ./docs/source/developer_guide/evaluation/accuracy_report
+          github-token: ${{ secrets.GITHUB_TOKEN }}
+          # Same repository the run id was looked up in (was hard-coded).
+          repository: ${{ github.repository }}
+          run-id: ${{ steps.get_Qwen2_5_VL_7B_Instruct_latest_run_id_V0.outputs.runid }}
+
+      # Download the Qwen2.5-7B-Instruct report from the run resolved by the
+      # matching query step into the accuracy report docs directory.
+      - name: Download Qwen/Qwen2.5-7B-Instruct Artifact
+        uses: actions/download-artifact@v4
+        with:
+          name: ${{ github.event.inputs.vllm-ascend-version }}-Qwen2.5-7B-Instruct-V0-report
+          path: ./docs/source/developer_guide/evaluation/accuracy_report
+          github-token: ${{ secrets.GITHUB_TOKEN }}
+          # Same repository the run id was looked up in (was hard-coded).
+          repository: ${{ github.repository }}
+          run-id: ${{ steps.get_Qwen2_5_7B_Instruct_latest_run_id_V0.outputs.runid }}
+
+      # Download the Llama-3.1-8B-Instruct report from the run resolved by the
+      # matching query step into the accuracy report docs directory.
+      - name: Download meta-llama/Llama-3.1-8B-Instruct Artifact
+        uses: actions/download-artifact@v4
+        with:
+          name: ${{ github.event.inputs.vllm-ascend-version }}-Llama-3.1-8B-Instruct-V0-report
+          path: ./docs/source/developer_guide/evaluation/accuracy_report
+          github-token: ${{ secrets.GITHUB_TOKEN }}
+          # Same repository the run id was looked up in (was hard-coded).
+          repository: ${{ github.repository }}
+          run-id: ${{ steps.get_Llama_3_1_8B_Instruct_latest_run_id_V0.outputs.runid }}
+
+      # Download the Qwen3-8B report from the run resolved by the matching
+      # query step into the accuracy report docs directory.
+      - name: Download Qwen/Qwen3-8B Artifact
+        uses: actions/download-artifact@v4
+        with:
+          name: ${{ github.event.inputs.vllm-ascend-version }}-Qwen3-8B-V0-report
+          path: ./docs/source/developer_guide/evaluation/accuracy_report
+          github-token: ${{ secrets.GITHUB_TOKEN }}
+          # Same repository the run id was looked up in (was hard-coded).
+          repository: ${{ github.repository }}
+          run-id: ${{ steps.get_Qwen3_8B_latest_run_id_V0.outputs.runid }}
+
+      # Print each downloaded report into the job log, in a fixed order.
+      - name: Display Files
+        working-directory: ./docs/source/developer_guide/evaluation/accuracy_report
+        run: |
+          for model in Qwen2.5-VL-7B-Instruct Llama-3.1-8B-Instruct Qwen2.5-7B-Instruct Qwen3-8B; do
+            cat "./${model}.md"
+          done
+
+      # Commit the downloaded markdown reports to the auto-pr/accuracy-test
+      # branch and open (or update) a pull request for them.
+      - name: Create Pull Request for markdown update
+        uses: peter-evans/create-pull-request@v7
+        with:
+          token: ${{ secrets.PR_TOKEN }}
+          # Target the branch that was checked out and that the title and
+          # commit message name, not the ref the workflow was dispatched from.
+          base: ${{ github.event.inputs.branch }}
+          branch: auto-pr/accuracy-test
+          commit-message: "Update accuracy report for ${{ github.event.inputs.branch }}"
+          # Only the report files are committed; other workspace changes are ignored.
+          add-paths: ./docs/source/developer_guide/evaluation/accuracy_report/*.md
+          title: "[Doc]Update accuracy report for ${{ github.event.inputs.branch }}"
+          body: |
+            The accuracy results running on Ascend NPU have changed, I'm updating the report.
+            Please review the changes.
+
+            - [Workflow run][1]
+            - [Qwen2.5-7B-Instruct accuracy report][2]
+            - [Llama-3.1-8B-Instruct accuracy report][3]
+            - [Qwen2.5-VL-7B-Instruct accuracy report][4]
+            - [Qwen3-8B accuracy report][5]
+
+            [1]: ${{ github.server_url }}/${{ github.repository }}/actions/runs/${{ github.run_id }}
+            [2]: ${{ github.server_url }}/${{ github.repository }}/actions/runs/${{ steps.get_Qwen2_5_7B_Instruct_latest_run_id_V0.outputs.runid }}
+            [3]: ${{ github.server_url }}/${{ github.repository }}/actions/runs/${{ steps.get_Llama_3_1_8B_Instruct_latest_run_id_V0.outputs.runid }}
+            [4]: ${{ github.server_url }}/${{ github.repository }}/actions/runs/${{ steps.get_Qwen2_5_VL_7B_Instruct_latest_run_id_V0.outputs.runid }}
+            [5]: ${{ github.server_url }}/${{ github.repository }}/actions/runs/${{ steps.get_Qwen3_8B_latest_run_id_V0.outputs.runid }}