[CI] Split test cases in CI for better load balancing (#2180)

This commit is contained in:
Lianmin Zheng
2024-11-25 04:58:16 -08:00
committed by GitHub
parent 538fa0ae13
commit 254fd130e2
6 changed files with 37 additions and 23 deletions

View File

@@ -17,7 +17,8 @@ suites = {
 "test_json_constrained.py",
 "test_large_max_new_tokens.py",
 "test_metrics.py",
-"test_non_overlap_scheduler.py",
+"test_no_chunked_prefill.py",
+"test_no_overlap_scheduler.py",
 "test_openai_server.py",
 "test_pytorch_sampling_backend.py",
 "test_radix_attention.py",