Log iteration # for prefill and decode (#9366)
This commit is contained in:
@@ -123,7 +123,7 @@ class SchedulerMetricsMixin:
|
||||
token_usage_msg = f"token usage: {token_usage:.2f}, "
|
||||
|
||||
f = (
|
||||
f"Prefill batch. "
|
||||
f"Prefill batch [{self.forward_ct + 1}], "
|
||||
f"#new-seq: {len(can_run_list)}, "
|
||||
f"#new-token: {adder.log_input_tokens}, "
|
||||
f"#cached-token: {adder.log_hit_tokens}, "
|
||||
@@ -246,7 +246,7 @@ class SchedulerMetricsMixin:
|
||||
gap_latency / self.server_args.decode_log_interval
|
||||
)
|
||||
|
||||
msg = f"Decode batch. #running-req: {num_running_reqs}, {token_usage_msg}"
|
||||
msg = f"Decode batch [{self.forward_ct}], #running-req: {num_running_reqs}, {token_usage_msg}"
|
||||
|
||||
if self.spec_algorithm.is_none():
|
||||
spec_accept_length = 0
|
||||
|
||||
Reference in New Issue
Block a user