[Fix] Reduce busy polling when scheduler is idle (#6026)

This commit is contained in:
Povilas Kanapickas
2025-06-13 00:58:22 +03:00
committed by GitHub
parent 4b9971e401
commit bd7cfbd2f8
5 changed files with 48 additions and 1 deletion

View File

@@ -90,6 +90,7 @@ class ServerArgs:
download_dir: Optional[str] = None
base_gpu_id: int = 0
gpu_id_step: int = 1
sleep_on_idle: bool = False
# Logging
log_level: str = "info"
@@ -844,6 +845,11 @@ class ServerArgs:
default=ServerArgs.gpu_id_step,
help="The delta between consecutive GPU IDs that are used. For example, setting it to 2 will use GPU 0,2,4,...",
)
parser.add_argument(
"--sleep-on-idle",
action="store_true",
help="Reduce CPU usage when sglang is idle.",
)
# Logging
parser.add_argument(