From c03cece42f425cc8e73df77a6d1fcc316fd44b50 Mon Sep 17 00:00:00 2001 From: Lianmin Zheng Date: Wed, 11 Sep 2024 04:50:04 -0700 Subject: [PATCH] Improve error reporting during server launch (#1390) --- python/sglang/srt/server.py | 7 ++++--- 1 file changed, 4 insertions(+), 3 deletions(-) diff --git a/python/sglang/srt/server.py b/python/sglang/srt/server.py index 4aaf018a1..5bdee03de 100644 --- a/python/sglang/srt/server.py +++ b/python/sglang/srt/server.py @@ -447,13 +447,12 @@ def _wait_and_warmup(server_args, pipe_finish_writer, pid): time.sleep(1) try: res = requests.get(url + "/get_model_info", timeout=5, headers=headers) - assert res.status_code == 200, f"{res}" + assert res.status_code == 200, f"{res=}, {res.text=}" success = True break - except (AssertionError, requests.exceptions.RequestException) as e: + except (AssertionError, requests.exceptions.RequestException): last_traceback = get_exception_traceback() pass - model_info = res.json() if not success: if pipe_finish_writer is not None: @@ -462,6 +461,8 @@ def _wait_and_warmup(server_args, pipe_finish_writer, pid): kill_child_process(pid, including_parent=False) return + model_info = res.json() + # Send a warmup request request_name = "/generate" if model_info["is_generation"] else "/encode" max_new_tokens = 8 if model_info["is_generation"] else 1