Fix flakiness in LoRA batch test. (#7552)

2025-06-27 19:51:43 -07:00
parent 9efb2993da
commit 2373faa317
3 changed files with 44 additions and 56 deletions
--- a/python/sglang/test/runners.py
+++ b/python/sglang/test/runners.py
@@ -503,6 +503,7 @@ class SRTRunner:
        disable_overlap_schedule: bool = False,
        disable_custom_all_reduce: bool = False,
        torchao_config: Optional[str] = None,
+        sleep_on_idle=False,
    ):
        self.model_type = model_type
        self.is_generation = model_type == "generation"
@@ -540,6 +541,7 @@ class SRTRunner:
            disable_overlap_schedule=disable_overlap_schedule,
            cuda_graph_max_bs=4,
            disable_custom_all_reduce=disable_custom_all_reduce,
+            sleep_on_idle=sleep_on_idle,
            **spec_kwargs,
        )