From 19f33b3237fb4dbdb6c7431fb45a2c5548713acb Mon Sep 17 00:00:00 2001 From: Yudi Xue <10211+binarycrayon@users.noreply.github.com> Date: Tue, 26 Nov 2024 12:10:23 -0800 Subject: [PATCH] add sglang version to get_server_info (#2206) --- python/sglang/srt/server.py | 2 ++ test/srt/test_srt_endpoint.py | 3 +++ 2 files changed, 5 insertions(+) diff --git a/python/sglang/srt/server.py b/python/sglang/srt/server.py index 238d265b6..0d303c2cb 100644 --- a/python/sglang/srt/server.py +++ b/python/sglang/srt/server.py @@ -86,6 +86,7 @@ from sglang.srt.utils import ( set_ulimit, ) from sglang.utils import get_exception_traceback +from sglang.version import __version__ logger = logging.getLogger(__name__) @@ -527,6 +528,7 @@ async def _get_server_info(): **dataclasses.asdict(tokenizer_manager.server_args), # server args "memory_pool_size": await tokenizer_manager.get_memory_pool_size(), # memory pool size "max_total_num_tokens": _max_total_num_tokens, # max total num tokens + "version": __version__, } diff --git a/test/srt/test_srt_endpoint.py b/test/srt/test_srt_endpoint.py index 9f2e15641..fb50943f1 100644 --- a/test/srt/test_srt_endpoint.py +++ b/test/srt/test_srt_endpoint.py @@ -226,6 +226,9 @@ class TestSRTEndpoint(unittest.TestCase): attention_backend = response_json["attention_backend"] self.assertIsInstance(attention_backend, str) + version = response_json["version"] + self.assertIsInstance(version, str) + if __name__ == "__main__": unittest.main()