Support VILA models (#6106)

This commit is contained in:
Zijian
2025-06-12 02:47:25 +08:00
committed by GitHub
parent 02543b545c
commit 31d6dee5c4
7 changed files with 419 additions and 3 deletions

View File

@@ -399,7 +399,7 @@ async def async_request_sglang_generate(
# NOTE: Some completion API might have a last
# usage summary response without a token so we
# want to check a token was generated
-if data["text"]:
+if "text" in data and data["text"]:
timestamp = time.perf_counter()
generated_text = data["text"]
output_len = data["meta_info"]["completion_tokens"]