[Model]Add support for qwen3_vl and qwen3_vl_moe (#3103)

### What this PR does / why we need it?
This PR adapts and optimizes qwen3_vl and qwen3_vl_moe for the Ascend platform.

### Does this PR introduce _any_ user-facing change?
None

### How was this patch tested?
- vLLM version: v0.10.2
- vLLM main: b1068903fd

---------

Signed-off-by: booker123456 <945658361@qq.com>
2025-09-25 18:50:12 +08:00
parent f7a3815bff
commit 31dda3f557
2 changed files with 256 additions and 13 deletions
--- a/vllm_ascend/models/__init__.py
+++ b/vllm_ascend/models/__init__.py
@@ -8,6 +8,16 @@ def register_model():
        "Qwen2VLForConditionalGeneration",
        "vllm_ascend.models.qwen2_vl:AscendQwen2VLForConditionalGeneration")

+    ModelRegistry.register_model(
+        "Qwen3VLMoeForConditionalGeneration",
+        "vllm_ascend.models.qwen2_5_vl_without_padding:AscendQwen3VLMoeForConditionalGeneration"
+    )
+
+    ModelRegistry.register_model(
+        "Qwen3VLForConditionalGeneration",
+        "vllm_ascend.models.qwen2_5_vl_without_padding:AscendQwen3VLForConditionalGeneration"
+    )
+
    if envs_ascend.USE_OPTIMIZED_MODEL:
        ModelRegistry.register_model(
            "Qwen2_5_VLForConditionalGeneration",