diff --git a/python/sglang/srt/managers/tp_worker.py b/python/sglang/srt/managers/tp_worker.py index 017f9a1f8..1cdc48c25 100644 --- a/python/sglang/srt/managers/tp_worker.py +++ b/python/sglang/srt/managers/tp_worker.py @@ -146,7 +146,7 @@ class TpModelWorker: assert self.max_running_requests > 0, "max_running_request is zero" self.max_queued_requests = server_args.max_queued_requests assert ( - self.max_running_requests > 0 + self.max_queued_requests > 0 ), "max_queued_requests is zero. We need to be at least 1 to schedule a request." self.max_req_len = min( self.model_config.context_len - 1,