Adjust concurrency group for each npu workflow (#1068)

### What this PR does / why we need it?
Adjust concurrency group for each npu workflow
- The pd and benchmarks workflows share static-8-01-cards, so only one job
can run on it at a time
- For the other workflows, each PR/schedule should have only one job running

### Does this PR introduce _any_ user-facing change?
No

### How was this patch tested?
CI passed

Signed-off-by: Yikun Jiang <yikunkero@gmail.com>
This commit is contained in:
Yikun Jiang
2025-06-05 09:17:04 +08:00
committed by GitHub
parent afc4c0cd03
commit 9e855b70be
4 changed files with 10 additions and 15 deletions

View File

@@ -62,8 +62,9 @@ defaults:
run:
shell: bash -el {0}
# only cancel in-progress runs of the same workflow
concurrency:
group: pr-${{ github.event.pull_request.number }}
group: ${{ github.workflow }}-${{ github.ref }}
cancel-in-progress: true
jobs:

View File

@@ -33,9 +33,10 @@ defaults:
run:
shell: bash -el {0}
# only 1 job can run on static-8-01-cards at a time
concurrency:
group: pr-${{ github.event.pull_request.number }}
cancel-in-progress: true
group: static-8-01-cards
cancel-in-progress: false
jobs:
test:

View File

@@ -30,8 +30,9 @@ defaults:
run:
shell: bash -el {0}
# only cancel in-progress runs of the same workflow
concurrency:
group: pr-${{ github.event.pull_request.number }}
group: ${{ github.workflow }}-${{ github.ref }}
cancel-in-progress: true
jobs:
@@ -43,15 +44,6 @@ jobs:
matrix:
os: [linux-arm64-npu-1, linux-arm64-npu-4]
vllm_version: [main, v0.9.0]
concurrency:
group: >
${{
matrix.os == 'linux-arm64-npu-4'
&& github.event.pull_request.number
&& format('pr-{0}-limit-npu-4-long-term', github.event.pull_request.number)
|| format('job-{0}-{1}-{2}-long-term', matrix.os, matrix.vllm_version, github.event.pull_request.number)
}}
cancel-in-progress: false
name: vLLM Ascend long term test
runs-on: ${{ matrix.os }}
container:

View File

@@ -30,9 +30,10 @@ defaults:
run:
shell: bash -el {0}
# only 1 job can run on static-8-01-cards at a time
concurrency:
group: pr-${{ github.event.pull_request.number }}
cancel-in-progress: true
group: static-8-01-cards
cancel-in-progress: false
jobs:
prefilling-decoding-disaggregation: