Fix mixed chunked prefill (#1850)

This commit is contained in:
Lianmin Zheng
2024-10-30 21:20:41 -07:00
committed by GitHub
parent a7a0a6886b
commit f7102fbd2b
3 changed files with 80 additions and 23 deletions

View File

@@ -8,6 +8,7 @@ from sglang.test.test_utils import (
DEFAULT_MODEL_NAME_FOR_TEST,
run_bench_serving,
run_mmlu_test,
run_mulit_request_test,
)
@@ -39,6 +40,12 @@ class TestChunkedPrefill(unittest.TestCase):
assert res["completed"] == 10
# Multi-request test with mixed chunking enabled and a chunked-prefill size of 2048.
# All of the work is delegated to the shared helper imported from
# sglang.test.test_utils; this method adds no assertions of its own, so the
# test presumably passes or fails based on what the helper checks internally
# -- TODO confirm against the helper's implementation.
# NOTE(review): the helper's name is spelled "mulit" in the import list as
# well, so the spelling must not be "corrected" at this call site alone.
def test_mixed_chunked_prefill_multi_requests(self):
run_mulit_request_test(
enable_mixed_chunk=True,
chunked_prefill_size=2048,
)
# Run this module's tests through unittest when the file is executed directly.
if __name__ == "__main__":
unittest.main()