[ROCm] Enable MTP (NextN) on AMD GPU (#4631)

This commit is contained in:
Alex Sun
2025-03-24 13:58:05 +08:00
committed by GitHub
parent 93cf7fc5cd
commit af6535e7aa
7 changed files with 43 additions and 4 deletions

View File

@@ -54,7 +54,7 @@ class TestDeepseekV3MTP(unittest.TestCase):
cls.model = "lmsys/sglang-ci-dsv3-test"
cls.base_url = DEFAULT_URL_FOR_TEST
other_args = ["--trust-remote-code"]
-if torch.cuda.is_available() and torch.version.cuda:
+if torch.cuda.is_available() and (torch.version.cuda or torch.version.hip):
other_args.extend(
[
"--cuda-graph-max-bs",