[ModelRunner] Add hunyuan-vl basic support (#5151)

### What this PR does / why we need it? This patch add handling of `XDRotaryEmbedding` in modelrunner to support for `hunyuan-vl` ### Does this PR introduce _any_ user-facing change? ### How was this patch tested? CI passed with added/exist tests Closes: https://github.com/vllm-project/vllm-ascend/issues/4992 - vLLM version: v0.12.0 - vLLM main: ad32e3e19c --------- Signed-off-by: wangli <wangli858794774@gmail.com>
2025-12-23 10:46:54 +08:00
parent c9b5881bcd
commit 9a79cbaecb
3 changed files with 63 additions and 25 deletions
--- a/tests/e2e/conftest.py
+++ b/tests/e2e/conftest.py
@@ -763,11 +763,32 @@ def qwen_prompt(questions: list[str]) -> list[str]:
             f"{q}<|im_end|>\n<|im_start|>assistant\n") for q in questions]


-PROMPT_TEMPLATES = {
-    "qwen2.5vl": qwen_prompt,
+def hunyuan_prompt(questions: list[str]) -> list[str]:
+    placeholder = "<｜hy_place▁holder▁no▁100｜><｜hy_place▁holder▁no▁102｜><｜hy_place▁holder▁no▁101｜>"  # noqa: E501
+    return [
+        f"<｜hy_begin▁of▁sentence｜>{placeholder}{question}<｜hy_User｜>"
+        for question in questions
+    ]
+
+
+PROMPT_CONFIGS = {
+    "qwen-vl": {
+        "model": "Qwen/Qwen3-VL-8B-Instruct",
+        "prompt_fn": qwen_prompt,
+        "mm_processor_kwargs": {
+            "min_pixels": 28 * 28,
+            "max_pixels": 1280 * 28 * 28,
+            "fps": 1,
+        },
+    },
+    "hunyuan-vl": {
+        "model": "Tencent-Hunyuan/HunyuanOCR",
+        "prompt_fn": hunyuan_prompt,
+        "mm_processor_kwargs": {},
+    },
 }


-@pytest.fixture(params=list(PROMPT_TEMPLATES.keys()))
-def prompt_template(request):
-    return PROMPT_TEMPLATES[request.param]
+@pytest.fixture(params=PROMPT_CONFIGS.keys())
+def vl_config(request):
+    return PROMPT_CONFIGS[request.param]