diff --git a/.github/workflows/accuracy-test.yml b/.github/workflows/accuracy-test.yml index 9c8e7bfeb..16bb584f4 100644 --- a/.github/workflows/accuracy-test.yml +++ b/.github/workflows/accuracy-test.yml @@ -43,3 +43,4 @@ jobs: run: | cd test/srt python3 test_eval_accuracy_large.py + timeout-minutes: 20 diff --git a/test/srt/test_moe_serving_throughput.py b/test/srt/test_moe_serving_throughput.py index 6353e5099..da223e80b 100644 --- a/test/srt/test_moe_serving_throughput.py +++ b/test/srt/test_moe_serving_throughput.py @@ -31,7 +31,7 @@ class TestServingThroughput(unittest.TestCase): ) # Run benchmark - num_prompts = 400 + num_prompts = 200 args = SimpleNamespace( backend="sglang", base_url=base_url,