[fix] PD disaggregation when MTP is enabled and tp != dp (#7420)

2025-06-22 03:03:11 +08:00
parent 5ea5d22170
commit 02bf31ef29
3 changed files with 4 additions and 3 deletions
--- a/python/sglang/srt/layers/dp_attention.py
+++ b/python/sglang/srt/layers/dp_attention.py
@@ -310,4 +310,4 @@ def attn_tp_reduce_scatter(


 def attn_tp_all_gather(output_list: List[torch.Tensor], input_: torch.Tensor):
-    return get_attention_tp_group().all_gather(input_, tensor_list=output_list)
+    return get_attention_tp_group().all_gather(input_, output_tensor_list=output_list)