Add --enable-p2p-check option (#599)

This commit is contained in:
Liangsheng Yin
2024-07-06 23:34:10 -07:00
committed by GitHub
parent 26908d9568
commit 5304b4ef58
4 changed files with 13 additions and 9 deletions

View File

@@ -55,6 +55,7 @@ class ServerArgs:
disable_regex_jump_forward: bool = False
disable_disk_cache: bool = False
attention_reduce_in_fp32: bool = False
enable_p2p_check: bool = False
# Distributed args
nccl_init_addr: Optional[str] = None
@@ -304,6 +305,11 @@ class ServerArgs:
help="Cast the intermidiate attention results to fp32 to avoid possible crashes related to fp16."
"This only affects Triton attention kernels",
)
# Opt-in flag: with action="store_true" the parsed value is False unless
# --enable-p2p-check is given, matching the enable_p2p_check field default.
parser.add_argument(
"--enable-p2p-check",
action="store_true",
help="Enable P2P check for GPU access, otherwise the p2p access is allowed by default.",
)
@classmethod
def from_cli_args(cls, args: argparse.Namespace):