Improve benchmark scripts (#717)

This commit is contained in:
Ying Sheng
2024-07-24 14:44:14 -07:00
committed by GitHub
parent 08a3bd19cc
commit 30d8e130e7
3 changed files with 6 additions and 7 deletions

View File

@@ -116,13 +116,9 @@ class ModelTpServer:
f"[gpu_id={self.gpu_id}] "
f"max_total_num_tokens={self.max_total_num_tokens}, "
f"max_prefill_tokens={self.max_prefill_tokens}, "
f"max_running_requests={self.max_running_requests}, "
f"context_len={self.model_config.context_len}"
)
if self.tp_rank == 0:
logger.info(
f"[gpu_id={self.gpu_id}] "
f"server_args: {server_args.print_mode_args()}"
)
# Init cache
self.tree_cache = RadixCache(