ci: update timeout and retry (#1086)
Co-authored-by: Liangsheng Yin <hnyls2002@gmail.com>
This commit is contained in:
4
.github/workflows/accuracy-test.yml
vendored
4
.github/workflows/accuracy-test.yml
vendored
@@ -6,11 +6,13 @@ on:
|
|||||||
paths:
|
paths:
|
||||||
- "python/sglang/**"
|
- "python/sglang/**"
|
||||||
- "test/**"
|
- "test/**"
|
||||||
|
- ".github/workflows/accuracy-test.yml"
|
||||||
pull_request:
|
pull_request:
|
||||||
branches: [ main ]
|
branches: [ main ]
|
||||||
paths:
|
paths:
|
||||||
- "python/sglang/**"
|
- "python/sglang/**"
|
||||||
- "test/**"
|
- "test/**"
|
||||||
|
- ".github/workflows/accuracy-test.yml"
|
||||||
workflow_dispatch:
|
workflow_dispatch:
|
||||||
|
|
||||||
concurrency:
|
concurrency:
|
||||||
@@ -43,4 +45,4 @@ jobs:
|
|||||||
run: |
|
run: |
|
||||||
cd test/srt
|
cd test/srt
|
||||||
python3 test_eval_accuracy_large.py
|
python3 test_eval_accuracy_large.py
|
||||||
timeout-minutes: 20
|
timeout-minutes: 10
|
||||||
|
|||||||
5
.github/workflows/e2e-test.yml
vendored
5
.github/workflows/e2e-test.yml
vendored
@@ -6,11 +6,13 @@ on:
|
|||||||
paths:
|
paths:
|
||||||
- "python/sglang/**"
|
- "python/sglang/**"
|
||||||
- "test/**"
|
- "test/**"
|
||||||
|
- ".github/workflows/e2e-test.yml"
|
||||||
pull_request:
|
pull_request:
|
||||||
branches: [ main ]
|
branches: [ main ]
|
||||||
paths:
|
paths:
|
||||||
- "python/sglang/**"
|
- "python/sglang/**"
|
||||||
- "test/**"
|
- "test/**"
|
||||||
|
- ".github/workflows/e2e-test.yml"
|
||||||
workflow_dispatch:
|
workflow_dispatch:
|
||||||
|
|
||||||
concurrency:
|
concurrency:
|
||||||
@@ -39,13 +41,16 @@ jobs:
|
|||||||
run: |
|
run: |
|
||||||
cd test/srt
|
cd test/srt
|
||||||
python3 -m unittest test_serving_throughput.TestServingThroughput.test_default
|
python3 -m unittest test_serving_throughput.TestServingThroughput.test_default
|
||||||
|
timeout-minutes: 10
|
||||||
|
|
||||||
- name: Benchmark Serving Throughput (w/o RadixAttention)
|
- name: Benchmark Serving Throughput (w/o RadixAttention)
|
||||||
run: |
|
run: |
|
||||||
cd test/srt
|
cd test/srt
|
||||||
python3 -m unittest test_serving_throughput.TestServingThroughput.test_default_without_radix_cache
|
python3 -m unittest test_serving_throughput.TestServingThroughput.test_default_without_radix_cache
|
||||||
|
timeout-minutes: 10
|
||||||
|
|
||||||
- name: Benchmark Serving Throughput (w/ ChunkedPrefill)
|
- name: Benchmark Serving Throughput (w/ ChunkedPrefill)
|
||||||
run: |
|
run: |
|
||||||
cd test/srt
|
cd test/srt
|
||||||
python3 -m unittest test_serving_throughput.TestServingThroughput.test_default_with_chunked_prefill
|
python3 -m unittest test_serving_throughput.TestServingThroughput.test_default_with_chunked_prefill
|
||||||
|
timeout-minutes: 10
|
||||||
|
|||||||
15
.github/workflows/moe-test.yml
vendored
15
.github/workflows/moe-test.yml
vendored
@@ -6,11 +6,13 @@ on:
|
|||||||
paths:
|
paths:
|
||||||
- "python/sglang/**"
|
- "python/sglang/**"
|
||||||
- "test/**"
|
- "test/**"
|
||||||
|
- ".github/workflows/moe-test.yml"
|
||||||
pull_request:
|
pull_request:
|
||||||
branches: [ main ]
|
branches: [ main ]
|
||||||
paths:
|
paths:
|
||||||
- "python/sglang/**"
|
- "python/sglang/**"
|
||||||
- "test/**"
|
- "test/**"
|
||||||
|
- ".github/workflows/moe-test.yml"
|
||||||
workflow_dispatch:
|
workflow_dispatch:
|
||||||
|
|
||||||
concurrency:
|
concurrency:
|
||||||
@@ -36,7 +38,12 @@ jobs:
|
|||||||
pip install flashinfer -i https://flashinfer.ai/whl/cu121/torch2.4/ --force-reinstall
|
pip install flashinfer -i https://flashinfer.ai/whl/cu121/torch2.4/ --force-reinstall
|
||||||
|
|
||||||
- name: Benchmark MOE Serving Throughput
|
- name: Benchmark MOE Serving Throughput
|
||||||
run: |
|
uses: nick-fields/retry@v3
|
||||||
cd test/srt
|
with:
|
||||||
python3 -m unittest test_moe_serving_throughput.TestServingThroughput.test_default
|
timeout_minutes: 15
|
||||||
python3 -m unittest test_moe_serving_throughput.TestServingThroughput.test_default_without_radix_cache
|
max_attempts: 2
|
||||||
|
retry_on: error
|
||||||
|
command: |
|
||||||
|
cd test/srt
|
||||||
|
python3 -m unittest test_moe_serving_throughput.TestServingThroughput.test_default
|
||||||
|
python3 -m unittest test_moe_serving_throughput.TestServingThroughput.test_default_without_radix_cache
|
||||||
|
|||||||
4
.github/workflows/unit-test.yml
vendored
4
.github/workflows/unit-test.yml
vendored
@@ -6,11 +6,13 @@ on:
|
|||||||
paths:
|
paths:
|
||||||
- "python/sglang/**"
|
- "python/sglang/**"
|
||||||
- "test/**"
|
- "test/**"
|
||||||
|
- ".github/workflows/unit-test.yml"
|
||||||
pull_request:
|
pull_request:
|
||||||
branches: [ main ]
|
branches: [ main ]
|
||||||
paths:
|
paths:
|
||||||
- "python/sglang/**"
|
- "python/sglang/**"
|
||||||
- "test/**"
|
- "test/**"
|
||||||
|
- ".github/workflows/unit-test.yml"
|
||||||
workflow_dispatch:
|
workflow_dispatch:
|
||||||
|
|
||||||
concurrency:
|
concurrency:
|
||||||
@@ -41,8 +43,10 @@ jobs:
|
|||||||
run: |
|
run: |
|
||||||
cd test/srt
|
cd test/srt
|
||||||
python3 run_suite.py --suite minimal
|
python3 run_suite.py --suite minimal
|
||||||
|
timeout-minutes: 15
|
||||||
|
|
||||||
- name: Test Frontend Language
|
- name: Test Frontend Language
|
||||||
run: |
|
run: |
|
||||||
cd test/lang
|
cd test/lang
|
||||||
python3 run_suite.py --suite minimal
|
python3 run_suite.py --suite minimal
|
||||||
|
timeout-minutes: 10
|
||||||
|
|||||||
@@ -73,7 +73,7 @@ class TestServingThroughput(unittest.TestCase):
|
|||||||
|
|
||||||
if os.getenv("SGLANG_IS_IN_CI", "false") == "true":
|
if os.getenv("SGLANG_IS_IN_CI", "false") == "true":
|
||||||
# A100 (PCIE) performance
|
# A100 (PCIE) performance
|
||||||
assert res["output_throughput"] > 950
|
assert res["output_throughput"] > 930
|
||||||
|
|
||||||
def test_default_without_radix_cache(self):
|
def test_default_without_radix_cache(self):
|
||||||
res = self.run_test(
|
res = self.run_test(
|
||||||
|
|||||||
Reference in New Issue
Block a user