diff --git a/python/sglang/srt/layers/rotary_embedding.py b/python/sglang/srt/layers/rotary_embedding.py
index aadaf4e3e..88a491e47 100644
--- a/python/sglang/srt/layers/rotary_embedding.py
+++ b/python/sglang/srt/layers/rotary_embedding.py
@@ -645,7 +645,25 @@ class DeepseekScalingRotaryEmbedding(RotaryEmbedding):
         cache = torch.cat((cos, sin), dim=-1)
         return cache
 
-    def forward(
+    def forward_hip(self, *args, **kwargs):
+        """Delegate to ``forward_native`` with the same arguments."""
+        return self.forward_native(*args, **kwargs)
+
+    def forward(self, *args, **kwargs):
+        """Dispatch to ``forward_native`` or ``forward_cuda``.
+
+        ``forward_native`` is used while compiling and whenever
+        ``_is_cuda_available`` is falsy; otherwise ``forward_cuda`` is used.
+        """
+        # is_compiling is a function and must be called: the bare function
+        # object is always truthy, which made forward_cuda unreachable.
+        if torch._dynamo.is_compiling():
+            return self.forward_native(*args, **kwargs)
+        if _is_cuda_available:
+            return self.forward_cuda(*args, **kwargs)
+        return self.forward_native(*args, **kwargs)
+
+    def forward_native(
         self,
         positions: torch.Tensor,
         query: torch.Tensor,