From 5317902670fcedc59861b41e1fa36a49866495db Mon Sep 17 00:00:00 2001 From: Ke Bao Date: Sat, 1 Feb 2025 16:07:54 +0800 Subject: [PATCH] Add test for fp8 torch compile (#3246) --- test/srt/test_mla.py | 7 ++++++- 1 file changed, 6 insertions(+), 1 deletion(-) diff --git a/test/srt/test_mla.py b/test/srt/test_mla.py index 34bc4b446..630573250 100644 --- a/test/srt/test_mla.py +++ b/test/srt/test_mla.py @@ -62,7 +62,12 @@ class TestDeepseekV3(unittest.TestCase): cls.model, cls.base_url, timeout=DEFAULT_TIMEOUT_FOR_SERVER_LAUNCH, - other_args=["--trust-remote-code"], + other_args=[ + "--trust-remote-code", + "--enable-torch-compile", + "--cuda-graph-max-bs", + "2", + ], ) @classmethod