Support VILA models (#6106)

2025-06-12 02:47:25 +08:00
parent 02543b545c
commit 31d6dee5c4
7 changed files with 419 additions and 3 deletions
--- a/python/sglang/bench_serving.py
+++ b/python/sglang/bench_serving.py
@@ -399,7 +399,7 @@ async def async_request_sglang_generate(
                            # NOTE: Some completion API might have a last
                            # usage summary response without a token so we
                            # want to check a token was generated
-                            if data["text"]:
+                            if "text" in data and data["text"]:
                                timestamp = time.perf_counter()
                                generated_text = data["text"]
                                output_len = data["meta_info"]["completion_tokens"]