From 886fcbdd096d88e96656a29f1694a8e31a8517cc Mon Sep 17 00:00:00 2001
From: strgrb
Date: Thu, 27 Mar 2025 16:45:37 +0800
Subject: [PATCH] Use apply_rope_with_cos_sin_cache_inplace for DeepSeek (#4764)

Co-authored-by: Zhang Kaihong
---
 python/sglang/srt/layers/rotary_embedding.py | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/python/sglang/srt/layers/rotary_embedding.py b/python/sglang/srt/layers/rotary_embedding.py
index fb6bdd76b..648b97cf0 100644
--- a/python/sglang/srt/layers/rotary_embedding.py
+++ b/python/sglang/srt/layers/rotary_embedding.py
@@ -645,7 +645,7 @@ class DeepseekScalingRotaryEmbedding(RotaryEmbedding):
         cache = torch.cat((cos, sin), dim=-1)
         return cache
 
-    def forward(
+    def forward_native(
         self,
         positions: torch.Tensor,
         query: torch.Tensor,