diff --git a/python/sglang/srt/distributed/parallel_state.py b/python/sglang/srt/distributed/parallel_state.py index e0d533479..464bd2b17 100644 --- a/python/sglang/srt/distributed/parallel_state.py +++ b/python/sglang/srt/distributed/parallel_state.py @@ -1539,6 +1539,7 @@ def initialize_model_parallel( group_name="tp", pynccl_use_current_stream=duplicate_tp_group, torch_compile=torch_compile, + use_custom_allreduce = False, ) if duplicate_tp_group: