Move mem_fraction_static adjustment for multimodal models to server_args.py & Fix session control & Other cleanups (#7748)

This commit is contained in:
Lianmin Zheng
2025-07-04 16:33:33 -07:00
committed by GitHub
parent 975a5ec69c
commit 14229ccf8f
16 changed files with 339 additions and 137 deletions

View File

@@ -1148,6 +1148,7 @@ class TokenizerManager:
[
"text",
"output_ids",
"embedding",
]
)
elif self.log_requests_level == 1:
@@ -1166,6 +1167,7 @@ class TokenizerManager:
[
"text",
"output_ids",
"embedding",
]
)
elif self.log_requests_level == 2: