[Fix] Reduce busy polling when scheduler is idle (#6026)
This commit is contained in:
committed by
GitHub
parent
4b9971e401
commit
bd7cfbd2f8
@@ -90,6 +90,7 @@ class ServerArgs:
|
||||
download_dir: Optional[str] = None
|
||||
base_gpu_id: int = 0
|
||||
gpu_id_step: int = 1
|
||||
sleep_on_idle: bool = False
|
||||
|
||||
# Logging
|
||||
log_level: str = "info"
|
||||
@@ -844,6 +845,11 @@ class ServerArgs:
|
||||
default=ServerArgs.gpu_id_step,
|
||||
help="The delta between consecutive GPU IDs that are used. For example, setting it to 2 will use GPU 0,2,4,...",
|
||||
)
|
||||
parser.add_argument(
|
||||
"--sleep-on-idle",
|
||||
action="store_true",
|
||||
help="Reduce CPU usage when sglang is idle.",
|
||||
)
|
||||
|
||||
# Logging
|
||||
parser.add_argument(
|
||||
|
||||
Reference in New Issue
Block a user