Add minimal support for setting NUMA nodes for different ranks (#10006)

This commit is contained in:
fzyzcjy
2025-09-05 19:01:27 +08:00
committed by GitHub
parent 339f8eef09
commit df97b31f37
3 changed files with 20 additions and 0 deletions

View File

@@ -351,6 +351,7 @@ class ServerArgs:
disable_fast_image_processor: bool = False
enable_return_hidden_states: bool = False
scheduler_recv_interval: int = 1
numa_node: Optional[List[int]] = None
# Debug tensor dumps
debug_tensor_dump_output_folder: Optional[str] = None
@@ -1991,6 +1992,12 @@ class ServerArgs:
default=ServerArgs.scheduler_recv_interval,
help="The interval to poll requests in scheduler. Can be set to >1 to reduce the overhead of this.",
)
parser.add_argument(
"--numa-node",
type=int,
nargs="+",
help="Sets the numa node for the subprocesses. i-th element corresponds to i-th subprocess.",
)
# Debug tensor dumps
parser.add_argument(