diff --git a/test/srt/test_bench_serving.py b/test/srt/test_bench_serving.py index 8233438fc..b0c6dcd19 100644 --- a/test/srt/test_bench_serving.py +++ b/test/srt/test_bench_serving.py @@ -153,6 +153,8 @@ class TestBenchServing(unittest.TestCase): "64", "--mem-fraction-static", "0.7", + "--cuda-graph-max-bs", + "32", ], )