diff --git a/python/sglang/srt/server.py b/python/sglang/srt/server.py index ae886796c59..4f06f76300b 100644 --- a/python/sglang/srt/server.py +++ b/python/sglang/srt/server.py @@ -360,6 +360,7 @@ def _set_envs_and_config(server_args: ServerArgs): os.environ["NCCL_CUMEM_ENABLE"] = "0" os.environ["NCCL_NVLS_ENABLE"] = "0" os.environ["TORCH_NCCL_AVOID_RECORD_STREAMS"] = "1" + os.environ["CUDA_DEVICE_MAX_CONNECTIONS"] = "1" # Set ulimit set_ulimit()