Update CI runner docs (#1213)

This commit is contained in:
Lianmin Zheng
2024-08-25 17:31:52 -07:00
committed by GitHub
parent 15f1a49d2d
commit 61bb223e0f
2 changed files with 34 additions and 79 deletions

View File

@@ -33,13 +33,13 @@ jobs:
pip install flashinfer -i https://flashinfer.ai/whl/cu121/torch2.4/ --force-reinstall
- name: Benchmark MoE Serving Throughput
-timeout_minutes: 10
+timeout-minutes: 10
run: |
cd test/srt
python3 -m unittest test_moe_serving_throughput.TestServingThroughput.test_default
- name: Benchmark MoE Serving Throughput (w/o RadixAttention)
-timeout_minutes: 10
+timeout-minutes: 10
run: |
cd test/srt
python3 -m unittest test_moe_serving_throughput.TestServingThroughput.test_default_without_radix_cache