Fix and Clean up chat-template requirement for VLM (#6114)

Signed-off-by: Xinyuan Tong <justinning0323@outlook.com>
2025-05-10 09:14:09 -07:00
parent c178abdabc
commit 9d8ec2e67e
16 changed files with 104 additions and 195 deletions
--- a/test/srt/test_bnb.py
+++ b/test/srt/test_bnb.py
@@ -29,10 +29,10 @@ from sglang.test.test_utils import (
 )

 VISION_MODELS = [
-    ("unsloth/Qwen2.5-VL-7B-Instruct-bnb-4bit", "qwen2-vl"),
-    ("unsloth/Qwen2-VL-7B-Instruct-bnb-4bit", "qwen2-vl"),
-    ("unsloth/Llama-3.2-11B-Vision-Instruct-bnb-4bit", "llama_3_vision"),
-    ("unsloth/Llama-3.2-11B-Vision-bnb-4bit", "llama_3_vision"),
+    "unsloth/Qwen2.5-VL-7B-Instruct-bnb-4bit",
+    "unsloth/Qwen2-VL-7B-Instruct-bnb-4bit",
+    "unsloth/Llama-3.2-11B-Vision-Instruct-bnb-4bit",
+    "unsloth/Llama-3.2-11B-Vision-bnb-4bit",
 ]
 LANGUAGE_MODELS = [
    "unsloth/Qwen2.5-7B-Instruct-bnb-4bit",
@@ -249,11 +249,9 @@ class TestVisionModel(CustomTestCase):
        if is_in_ci():
            models_to_test = [random.choice(VISION_MODELS)]

-        for model, template in models_to_test:
+        for model in models_to_test:
            with self.subTest(model=model):
                other_args = [
-                    "--chat-template",
-                    template,
                    "--mem-fraction-static",
                    "0.6",
                    "--load-format",