feat: add priority-based scheduling with priority-based request acceptance and preemption (#8746)

This commit is contained in:
harrisonlimh
2025-09-16 17:10:10 -07:00
committed by GitHub
parent f949ad5794
commit 14fdd52740
16 changed files with 822 additions and 71 deletions

View File

@@ -65,9 +65,8 @@ class TestMaxQueuedRequests(CustomTestCase):
send_concurrent_generate_requests(self.base_url, num_requests=10)
)
assert 200 in status_codes
assert 503 in status_codes
assert all(status_code in [200, 503] for status_code in status_codes)
expected_status_codes = [200, 200, 503, 503, 503, 503, 503, 503, 503, 503]
assert status_codes == expected_status_codes
def test_max_running_requests_and_max_queued_request_validation(self):
"""Verify running request and queued request numbers based on server logs."""