diff --git a/vllm_ascend/ops/rotary_embedding.py b/vllm_ascend/ops/rotary_embedding.py index afc01d55..04c9d302 100644 --- a/vllm_ascend/ops/rotary_embedding.py +++ b/vllm_ascend/ops/rotary_embedding.py @@ -586,7 +586,7 @@ class AscendMRotaryEmbedding(MRotaryEmbedding): query: torch.Tensor, key: torch.Tensor, ): - if HAS_TRITON and positions.ndim == 2: + if HAS_TRITON and positions.ndim == 2 and self.mrope_interleaved: # todo: need cann update in 8.5.0 return self.forward_triton(positions, query, key)