Make decode log interval configurable (#1847)
This commit is contained in:
@@ -919,7 +919,7 @@ class Scheduler:
|
||||
self.token_to_kv_pool.free_group_end()
|
||||
|
||||
self.forward_ct_decode = (self.forward_ct_decode + 1) % (1 << 30)
|
||||
if self.tp_rank == 0 and self.forward_ct_decode % 40 == 0:
|
||||
if self.tp_rank == 0 and self.forward_ct_decode % self.server_args.decode_log_interval == 0:
|
||||
self.print_decode_stats()
|
||||
|
||||
def add_logprob_return_values(
|
||||
|
||||
@@ -63,6 +63,7 @@ class ServerArgs:
|
||||
stream_interval: int = 1
|
||||
random_seed: Optional[int] = None
|
||||
constrained_json_whitespace_pattern: Optional[str] = None
|
||||
decode_log_interval: int = 40
|
||||
|
||||
# Logging
|
||||
log_level: str = "info"
|
||||
@@ -436,6 +437,12 @@ class ServerArgs:
|
||||
default=ServerArgs.watchdog_timeout,
|
||||
help="Set watchdog timeout in seconds. If a forward batch takes longer than this, the server will crash to prevent hanging.",
|
||||
)
|
||||
parser.add_argument(
|
||||
"--decode-log-interval",
|
||||
type=int,
|
||||
default=ServerArgs.decode_log_interval,
|
||||
help="The log interval of decode batch"
|
||||
)
|
||||
|
||||
# Data parallelism
|
||||
parser.add_argument(
|
||||
|
||||
Reference in New Issue
Block a user