Improve benchmark scripts (#717)
This commit is contained in:
@@ -116,13 +116,9 @@ class ModelTpServer:
|
||||
f"[gpu_id={self.gpu_id}] "
|
||||
f"max_total_num_tokens={self.max_total_num_tokens}, "
|
||||
f"max_prefill_tokens={self.max_prefill_tokens}, "
|
||||
f"max_running_requests={self.max_running_requests}, "
|
||||
f"context_len={self.model_config.context_len}"
|
||||
)
|
||||
if self.tp_rank == 0:
|
||||
logger.info(
|
||||
f"[gpu_id={self.gpu_id}] "
|
||||
f"server_args: {server_args.print_mode_args()}"
|
||||
)
|
||||
|
||||
# Init cache
|
||||
self.tree_cache = RadixCache(
|
||||
|
||||
Reference in New Issue
Block a user