diff --git a/python/sglang/srt/models/deepseek_v2.py b/python/sglang/srt/models/deepseek_v2.py index 1a5165030..d83a7bb06 100644 --- a/python/sglang/srt/models/deepseek_v2.py +++ b/python/sglang/srt/models/deepseek_v2.py @@ -1895,11 +1895,6 @@ class DeepseekV2DecoderLayer(nn.Module): hidden_states, residual, forward_batch ) - if self.enable_dp_attention and self.speculative_algorithm.is_eagle(): - # NOTE: this line resolves the degradation of MTP reception rate for non-zero DP ranks. - # See discussion here (https://github.com/sgl-project/sglang/pull/6081#discussion_r2147452251). - hidden_states = hidden_states.clone() - return hidden_states, residual def op_comm_prepare_attn(