Fix assertion typo in tp_worker.py (#9954)

This commit is contained in:
Seunggeun Cho
2025-09-10 14:43:50 +09:00
committed by GitHub
parent 4efe2c57c9
commit 0ac809de33

View File

@@ -146,7 +146,7 @@ class TpModelWorker:
assert self.max_running_requests > 0, "max_running_request is zero"
self.max_queued_requests = server_args.max_queued_requests
assert (
- self.max_running_requests > 0
+ self.max_queued_requests > 0
), "max_queued_requests is zero. We need to be at least 1 to schedule a request."
self.max_req_len = min(
self.model_config.context_len - 1,