From 31fccf5a4f79032769e899b4982777c89f22e642 Mon Sep 17 00:00:00 2001 From: ishandhanani <82981111+ishandhanani@users.noreply.github.com> Date: Wed, 18 Jun 2025 01:36:43 -0700 Subject: [PATCH] chore: change logs from `INFO` to `DEBUG` for dp and add force quit for tokenizer manager (#7251) --- python/sglang/srt/entrypoints/engine.py | 4 ++-- python/sglang/srt/managers/tokenizer_manager.py | 10 +++++++++- 2 files changed, 11 insertions(+), 3 deletions(-) diff --git a/python/sglang/srt/entrypoints/engine.py b/python/sglang/srt/entrypoints/engine.py index 96d5e0801..34f11d4d5 100644 --- a/python/sglang/srt/entrypoints/engine.py +++ b/python/sglang/srt/entrypoints/engine.py @@ -175,7 +175,7 @@ class Engine(EngineBase): """ if self.server_args.enable_dp_attention: if data_parallel_rank is None: - logger.info("data_parallel_rank not provided, using default dispatch") + logger.debug("data_parallel_rank not provided, using default dispatch") elif data_parallel_rank < 0: raise ValueError("data_parallel_rank must be non-negative") elif data_parallel_rank >= self.server_args.dp_size: @@ -258,7 +258,7 @@ class Engine(EngineBase): if self.server_args.enable_dp_attention: if data_parallel_rank is None: - logger.info("data_parallel_rank not provided, using default dispatch") + logger.debug("data_parallel_rank not provided, using default dispatch") elif data_parallel_rank < 0: raise ValueError("data_parallel_rank must be non-negative") elif data_parallel_rank >= self.server_args.dp_size: diff --git a/python/sglang/srt/managers/tokenizer_manager.py b/python/sglang/srt/managers/tokenizer_manager.py index b6e584d56..fbab668a4 100644 --- a/python/sglang/srt/managers/tokenizer_manager.py +++ b/python/sglang/srt/managers/tokenizer_manager.py @@ -1140,13 +1140,21 @@ class TokenizerManager: remain_num_req = len(self.rid_to_state) if self.health_check_failed: - # if health check failed, we should exit immediately + # if health check failed, exit immediately logger.error( "Signal SIGTERM 
received while health check failed. Exiting... remaining number of requests: %d", remain_num_req, ) break + elif get_bool_env_var("SGL_FORCE_SHUTDOWN"): + # if force shutdown flag set, exit immediately + logger.error( + "Signal SIGTERM received while force shutdown flag set. Force exiting... remaining number of requests: %d", + remain_num_req, + ) + break + logger.info( f"Gracefully exiting... remaining number of requests {remain_num_req}" )