Auto balance CI tests (#4238)

This commit is contained in:
Lianmin Zheng
2025-03-09 21:05:55 -07:00
committed by GitHub
parent 730d084f2a
commit fbd560028a
5 changed files with 151 additions and 84 deletions

View File

@@ -95,7 +95,7 @@ jobs:
strategy:
fail-fast: false
matrix:
range: [0-6, 6-15, 15-22, 22-32, 32-40, 40-48, 48-100]
part: [0, 1, 2, 3, 4, 5, 6]
steps:
- name: Checkout code
uses: actions/checkout@v3
@@ -109,11 +109,8 @@ jobs:
- name: Run test
timeout-minutes: 30
run: |
RANGE=${{ matrix.range }}
range_begin=${RANGE%-*}
range_end=${RANGE#*-}
cd test/srt
python3 run_suite.py --suite per-commit --range-begin ${range_begin} --range-end ${range_end}
python3 run_suite.py --suite per-commit --auto-partition-id ${{ matrix.part }} --auto-partition-size 7
unit-test-backend-2-gpu:
needs: filter
@@ -340,7 +337,6 @@ jobs:
python3 test_moe_eval_accuracy_large.py
finish:
if: always()
needs: [
unit-test-frontend, unit-test-backend-1-gpu, unit-test-backend-2-gpu,
performance-test-1-gpu-part-1, performance-test-1-gpu-part-2, performance-test-2-gpu,