chore: change logs from INFO to DEBUG for dp and add force quit for tokenizer manager (#7251)
This commit is contained in:
@@ -175,7 +175,7 @@ class Engine(EngineBase):
|
||||
"""
|
||||
if self.server_args.enable_dp_attention:
|
||||
if data_parallel_rank is None:
|
||||
logger.info("data_parallel_rank not provided, using default dispatch")
|
||||
logger.debug("data_parallel_rank not provided, using default dispatch")
|
||||
elif data_parallel_rank < 0:
|
||||
raise ValueError("data_parallel_rank must be non-negative")
|
||||
elif data_parallel_rank >= self.server_args.dp_size:
|
||||
@@ -258,7 +258,7 @@ class Engine(EngineBase):
|
||||
|
||||
if self.server_args.enable_dp_attention:
|
||||
if data_parallel_rank is None:
|
||||
logger.info("data_parallel_rank not provided, using default dispatch")
|
||||
logger.debug("data_parallel_rank not provided, using default dispatch")
|
||||
elif data_parallel_rank < 0:
|
||||
raise ValueError("data_parallel_rank must be non-negative")
|
||||
elif data_parallel_rank >= self.server_args.dp_size:
|
||||
|
||||
@@ -1140,13 +1140,21 @@ class TokenizerManager:
|
||||
remain_num_req = len(self.rid_to_state)
|
||||
|
||||
if self.health_check_failed:
|
||||
# if health check failed, we should exit immediately
|
||||
# if health check failed, exit immediately
|
||||
logger.error(
|
||||
"Signal SIGTERM received while health check failed. Exiting... remaining number of requests: %d",
|
||||
remain_num_req,
|
||||
)
|
||||
break
|
||||
|
||||
elif get_bool_env_var("SGL_FORCE_SHUTDOWN"):
|
||||
# if force shutdown flag set, exit immediately
|
||||
logger.error(
|
||||
"Signal SIGTERM received while force shutdown flag set. Force exiting... remaining number of requests: %d",
|
||||
remain_num_req,
|
||||
)
|
||||
break
|
||||
|
||||
logger.info(
|
||||
f"Gracefully exiting... remaining number of requests {remain_num_req}"
|
||||
)
|
||||
|
||||
Reference in New Issue
Block a user