[Model] Add Qwen3Next support in main (#4596)

### What this PR does / why we need it?

Add Qwen3Next support in main.

### Does this PR introduce _any_ user-facing change?

### How was this patch tested?

- vLLM version: v0.11.2
- vLLM main: https://github.com/vllm-project/vllm/commit/v0.11.2

---------

Signed-off-by: SunnyLee219 <3294305115@qq.com>
2025-12-03 14:17:37 +08:00
parent 3f81c4bb25
commit 38bd95229f
4 changed files with 7 additions and 3 deletions
--- a/vllm_ascend/ops/triton/mamba/casual_conv1d.py
+++ b/vllm_ascend/ops/triton/mamba/casual_conv1d.py
@@ -7,7 +7,7 @@
 # and https://github.com/vllm-project/vllm/blob/main/vllm/model_executor/layers/mamba/ops/causal_conv1d.py
 # mypy: ignore-errors

-from typing import Optional, Union
+from typing import Any, Optional, Union

 import torch
 import torch.nn.functional as F
@@ -72,6 +72,7 @@ def causal_conv1d_fn(
    conv_states: Optional[torch.Tensor] = None,
    activation: Optional[str] = "silu",
    pad_slot_id: int = PAD_SLOT_ID,
+    metadata: Optional[Any] = None,
 ):
    """
    x: (batch, dim, seqlen) or (dim,cu_seq_len) for varlen