From 52029bd1e3e30a1474ead6bddd20d79a162ebc6f Mon Sep 17 00:00:00 2001 From: fzyzcjy <5236035+fzyzcjy@users.noreply.github.com> Date: Tue, 25 Mar 2025 17:01:21 +0800 Subject: [PATCH] Fix warmup error when dp=1 (#4753) --- python/sglang/srt/entrypoints/http_server.py | 6 ++++++ 1 file changed, 6 insertions(+) diff --git a/python/sglang/srt/entrypoints/http_server.py b/python/sglang/srt/entrypoints/http_server.py index 114204d17..1024370a1 100644 --- a/python/sglang/srt/entrypoints/http_server.py +++ b/python/sglang/srt/entrypoints/http_server.py @@ -761,8 +761,14 @@ def _wait_and_warmup( } if server_args.skip_tokenizer_init: json_data["input_ids"] = [[10, 11, 12] for _ in range(server_args.dp_size)] + # TODO Workaround the bug that embedding errors for list of size 1 + if server_args.dp_size == 1: + json_data["input_ids"] = json_data["input_ids"][0] else: json_data["text"] = ["The capital city of France is"] * server_args.dp_size + # TODO Workaround the bug that embedding errors for list of size 1 + if server_args.dp_size == 1: + json_data["text"] = json_data["text"][0] # Debug dumping if server_args.debug_tensor_dump_input_file: