add sglang version to get_server_info (#2206)
This commit is contained in:
@@ -86,6 +86,7 @@ from sglang.srt.utils import (
|
|||||||
set_ulimit,
|
set_ulimit,
|
||||||
)
|
)
|
||||||
from sglang.utils import get_exception_traceback
|
from sglang.utils import get_exception_traceback
|
||||||
|
from sglang.version import __version__
|
||||||
|
|
||||||
logger = logging.getLogger(__name__)
|
logger = logging.getLogger(__name__)
|
||||||
|
|
||||||
@@ -527,6 +528,7 @@ async def _get_server_info():
|
|||||||
**dataclasses.asdict(tokenizer_manager.server_args), # server args
|
**dataclasses.asdict(tokenizer_manager.server_args), # server args
|
||||||
"memory_pool_size": await tokenizer_manager.get_memory_pool_size(), # memory pool size
|
"memory_pool_size": await tokenizer_manager.get_memory_pool_size(), # memory pool size
|
||||||
"max_total_num_tokens": _max_total_num_tokens, # max total num tokens
|
"max_total_num_tokens": _max_total_num_tokens, # max total num tokens
|
||||||
|
"version": __version__,
|
||||||
}
|
}
|
||||||
|
|
||||||
|
|
||||||
|
|||||||
@@ -226,6 +226,9 @@ class TestSRTEndpoint(unittest.TestCase):
|
|||||||
attention_backend = response_json["attention_backend"]
|
attention_backend = response_json["attention_backend"]
|
||||||
self.assertIsInstance(attention_backend, str)
|
self.assertIsInstance(attention_backend, str)
|
||||||
|
|
||||||
|
version = response_json["version"]
|
||||||
|
self.assertIsInstance(version, str)
|
||||||
|
|
||||||
|
|
||||||
if __name__ == "__main__":
|
if __name__ == "__main__":
|
||||||
unittest.main()
|
unittest.main()
|
||||||
|
|||||||
Reference in New Issue
Block a user