set CUDA_DEVICE_MAX_CONNECTIONS=1 (#1113)

This commit is contained in:
Lianmin Zheng
2024-08-15 10:47:39 -07:00
committed by GitHub
parent 93d4e354d8
commit 0cb099e20a

View File

@@ -360,6 +360,7 @@ def _set_envs_and_config(server_args: ServerArgs):
os.environ["NCCL_CUMEM_ENABLE"] = "0"
os.environ["NCCL_NVLS_ENABLE"] = "0"
os.environ["TORCH_NCCL_AVOID_RECORD_STREAMS"] = "1"
os.environ["CUDA_DEVICE_MAX_CONNECTIONS"] = "1"
# Set ulimit
set_ulimit()