Use only one GPU for MLA CI tests (#2858)
This commit is contained in:
@@ -21,8 +21,6 @@ class TestMLA(unittest.TestCase):
|
||||
cls.base_url,
|
||||
timeout=DEFAULT_TIMEOUT_FOR_SERVER_LAUNCH,
|
||||
other_args=[
|
||||
"--tp",
|
||||
"2",
|
||||
"--trust-remote-code",
|
||||
"--kv-cache-dtype",
|
||||
"fp8_e5m2",
|
||||
|
||||
Reference in New Issue
Block a user