[CI] Reorganize the 8 gpu tests (#6192)

This commit is contained in:
Lianmin Zheng
2025-05-11 10:55:06 -07:00
committed by GitHub
parent 01bdbf7f80
commit 03227c5fa6
6 changed files with 15 additions and 82 deletions

View File

@@ -305,6 +305,12 @@ class ServerArgs:
if self.grammar_backend is None:
self.grammar_backend = "xgrammar"
if self.pp_size > 1:
self.disable_overlap_schedule = True
logger.warning(
"Overlap scheduler is disabled because of using pipeline parallelism."
)
# Data parallelism attention
if self.enable_dp_attention:
self.schedule_conservativeness = self.schedule_conservativeness * 0.3