Add a new event loop (#1677)

This commit is contained in:
Lianmin Zheng
2024-10-16 01:33:20 -07:00
committed by GitHub
parent a5114b6f91
commit 9116b2896f
9 changed files with 161 additions and 25 deletions

View File

@@ -113,6 +113,7 @@ class ServerArgs:
disable_custom_all_reduce: bool = False
disable_mla: bool = False
disable_penalizer: bool = False
enable_overlap_schedule: bool = False
enable_mixed_chunk: bool = False
enable_torch_compile: bool = False
max_torch_compile_bs: int = 32
@@ -572,6 +573,11 @@ class ServerArgs:
action="store_true",
help="Disable the logit penalizer (e.g., frequency and repetition penalty).",
)
# Register the opt-in `--enable-overlap-schedule` switch. With `store_true` the
# option takes no value: it is either present on the command line or absent.
# NOTE(review): presumably `parser` is an argparse parser and this flag feeds
# the `enable_overlap_schedule` field on ServerArgs — confirm against the
# enclosing method, which is not visible here.
parser.add_argument(
"--enable-overlap-schedule",
action="store_true",
help="Overlap the CPU scheduler with GPU model worker. Experimental feature.",
)
parser.add_argument(
"--enable-mixed-chunk",
action="store_true",