Fix GPU OOM (#6564)

Co-authored-by: michael <michael.zhang@amd.com>
This commit is contained in:
kk
2025-05-25 07:38:39 +08:00
committed by GitHub
parent 24c035f2e3
commit 7a5e6ce1cb
8 changed files with 15 additions and 16 deletions

View File

@@ -90,9 +90,9 @@ class TestDeepseekV3MTP(CustomTestCase):
"2",
"--speculative-num-draft-tokens",
"4",
"--mem-fraction-static",
"0.7",
]
if os.environ.get("SGLANG_AMD_CI") != "1":
other_args += ["--mem-frac", "0.7"]
cls.process = popen_launch_server(
cls.model,
cls.base_url,