reverse the amd ci test back to 1200s and split the 8-gpu deepseek job into two. (#11238)

Co-authored-by: root <root@smci350-zts-gtu-e17-15.zts-gtu.dcgpu>
This commit is contained in:
sunxxuns
2025-10-06 19:27:57 -04:00
committed by GitHub
parent 708f4ff490
commit a57f0e3d56
4 changed files with 84 additions and 58 deletions

View File

@@ -152,7 +152,8 @@ suites = {
TestFile("test_disaggregation_dp_attention.py", 155),
TestFile("test_disaggregation_different_tp.py", 600),
TestFile("test_disaggregation_pp.py", 140),
TestFile("test_full_deepseek_v3.py", 550),
TestFile("test_deepseek_v3_basic.py", 275),
TestFile("test_deepseek_v3_mtp.py", 275),
],
"per-commit-4-gpu-b200": [
# TestFile("test_gpt_oss_4gpu.py", 600),
@@ -267,7 +268,8 @@ suite_amd = {
TestFile("test_pp_single_node.py", 150),
],
"per-commit-8-gpu-amd": [
TestFile("test_full_deepseek_v3.py", 250),
TestFile("test_deepseek_v3_basic.py", 275),
TestFile("test_deepseek_v3_mtp.py", 275),
],
"nightly-amd": [
TestFile("test_nightly_gsm8k_eval_amd.py"),
@@ -369,7 +371,7 @@ if __name__ == "__main__":
arg_parser.add_argument(
"--timeout-per-file",
type=int,
default=1500 if is_hip() else 1200,
default=1200,
help="The time limit for running one file in seconds.",
)
arg_parser.add_argument(