feat: add priority-based scheduling with priority-based request acceptance and preemption (#8746)
This commit is contained in:
@@ -95,6 +95,7 @@ suites = {
|
||||
TestFile("test_original_logprobs.py", 200),
|
||||
TestFile("test_penalty.py", 41),
|
||||
TestFile("test_page_size.py", 60),
|
||||
TestFile("test_priority_scheduling.py", 100),
|
||||
TestFile("test_pytorch_sampling_backend.py", 66),
|
||||
TestFile("test_radix_attention.py", 105),
|
||||
TestFile("test_regex_constrained.py", 64),
|
||||
|
||||
Reference in New Issue
Block a user