Improve error reporting during server launch (#1390)

2024-09-11 04:50:04 -07:00
parent 15c75e4146
commit c03cece42f
1 changed file with 4 additions and 3 deletions
--- a/python/sglang/srt/server.py
+++ b/python/sglang/srt/server.py
@@ -447,13 +447,12 @@ def _wait_and_warmup(server_args, pipe_finish_writer, pid):
        time.sleep(1)
        try:
            res = requests.get(url + "/get_model_info", timeout=5, headers=headers)
-            assert res.status_code == 200, f"{res}"
+            assert res.status_code == 200, f"{res=}, {res.text=}"
            success = True
            break
-        except (AssertionError, requests.exceptions.RequestException) as e:
+        except (AssertionError, requests.exceptions.RequestException):
            last_traceback = get_exception_traceback()
            pass
    model_info = res.json()
    if not success:
        if pipe_finish_writer is not None:
@@ -462,6 +461,8 @@ def _wait_and_warmup(server_args, pipe_finish_writer, pid):
        kill_child_process(pid, including_parent=False)
        return
    model_info = res.json()
    # Send a warmup request
    request_name = "/generate" if model_info["is_generation"] else "/encode"
    max_new_tokens = 8 if model_info["is_generation"] else 1