Enable MLA by default (#1447)

This commit is contained in:
Ke Bao
2024-09-17 19:42:48 +08:00
committed by GitHub
parent 90a26be31c
commit c6b6d2e71b
8 changed files with 16 additions and 18 deletions

View File

@@ -52,7 +52,7 @@ class TestEvalAccuracyLarge(unittest.TestCase):
if is_tp2:
other_args.extend(["--tp", "2"])
if "DeepSeek" in model:
-other_args.extend(["--enable-mla", "--mem-frac", "0.85"])
+other_args.extend(["--mem-frac", "0.85"])
self.process = popen_launch_server(
model,