diff --git a/python/sglang/srt/managers/controller/tp_worker.py b/python/sglang/srt/managers/controller/tp_worker.py index b07528141..baf509877 100644 --- a/python/sglang/srt/managers/controller/tp_worker.py +++ b/python/sglang/srt/managers/controller/tp_worker.py @@ -104,8 +104,7 @@ class ModelTpServer: else server_args.max_running_requests ) self.max_running_requests = min( - self.max_running_requests, - self.model_runner.req_to_token_pool.size - 1 + self.max_running_requests, self.model_runner.req_to_token_pool.size - 1 ) self.int_token_logit_bias = torch.tensor( get_int_token_logit_bias(self.tokenizer, self.model_config.vocab_size)