From 22bfed75094d10c18228aec813f0f21ec124d8be Mon Sep 17 00:00:00 2001 From: Cheng Wan <54331508+ch-wan@users.noreply.github.com> Date: Fri, 20 Jun 2025 14:45:16 -0700 Subject: [PATCH] [DeepSeekNextN] fix: residual of head norm can be None (#7398) --- python/sglang/srt/models/deepseek_nextn.py | 6 +++++- 1 file changed, 5 insertions(+), 1 deletion(-) diff --git a/python/sglang/srt/models/deepseek_nextn.py b/python/sglang/srt/models/deepseek_nextn.py index 8d7bc7b18..7ca945d3a 100644 --- a/python/sglang/srt/models/deepseek_nextn.py +++ b/python/sglang/srt/models/deepseek_nextn.py @@ -107,7 +107,11 @@ class DeepseekModelNextN(nn.Module): ) if not forward_batch.forward_mode.is_idle(): - hidden_states, _ = self.shared_head.norm(hidden_states, residual) + if residual is not None: + hidden_states, _ = self.shared_head.norm(hidden_states, residual) + else: + hidden_states = self.shared_head.norm(hidden_states) + return hidden_states