Add test for fp8 torch compile (#3246)

This commit is contained in:
Ke Bao
2025-02-01 16:07:54 +08:00
committed by GitHub
parent d7c0b32f4d
commit 5317902670

View File

@@ -62,7 +62,12 @@ class TestDeepseekV3(unittest.TestCase):
cls.model,
cls.base_url,
timeout=DEFAULT_TIMEOUT_FOR_SERVER_LAUNCH,
-other_args=["--trust-remote-code"],
+other_args=[
+"--trust-remote-code",
+"--enable-torch-compile",
+"--cuda-graph-max-bs",
+"2",
+],
)
@classmethod