From 4839999b76b217e90ea6827b47fb001b373ac080 Mon Sep 17 00:00:00 2001 From: fzyzcjy <5236035+fzyzcjy@users.noreply.github.com> Date: Thu, 29 May 2025 06:53:51 +0800 Subject: [PATCH] Overlap two kernels in DeepSeek with communication (#6711) --- python/sglang/srt/operations_strategy.py | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/python/sglang/srt/operations_strategy.py b/python/sglang/srt/operations_strategy.py index 6fd32e66a..8821a05eb 100644 --- a/python/sglang/srt/operations_strategy.py +++ b/python/sglang/srt/operations_strategy.py @@ -127,9 +127,9 @@ def _compute_moe_deepseek_blog_decode(layer): layer.mlp.op_combine_a, operations.YieldOperation(), layer.mlp.op_combine_b, + operations.YieldOperation(), layer.mlp.op_output, layer.op_comm_postprocess_layer, - operations.YieldOperation(), ], )