Enable chunked prefill by default (#1040)

This commit is contained in:
Lianmin Zheng
2024-08-14 21:56:20 -07:00
committed by GitHub
parent 8d2d876fc8
commit e86b1ccbf0
4 changed files with 10 additions and 10 deletions

View File

@@ -47,8 +47,8 @@ jobs:
  python3 -m unittest test_serving_throughput.TestServingThroughput.test_default_without_radix_cache
  timeout-minutes: 10
- - name: Benchmark Serving Throughput (w/ ChunkedPrefill)
+ - name: Benchmark Serving Throughput (w/o ChunkedPrefill)
  run: |
  cd test/srt
- python3 -m unittest test_serving_throughput.TestServingThroughput.test_default_with_chunked_prefill
+ python3 -m unittest test_serving_throughput.TestServingThroughput.test_default_without_chunked_prefill
  timeout-minutes: 10