model: Support nvidia/Llama-3_1-Nemotron-Ultra-253B-v1 (#9301)

This commit is contained in:
Netanel Haber
2025-08-26 10:33:40 +03:00
committed by GitHub
parent f92b729d52
commit 4cd08dc592
2 changed files with 7 additions and 0 deletions

View File

@@ -83,6 +83,12 @@ ALL_MODELS = [
trust_remote_code=True,
skip_long_prompt=True,
),
ModelCase(
"nvidia/Llama-3_1-Nemotron-Ultra-253B-v1",
tp_size=8,
trust_remote_code=True,
skip_long_prompt=True,
),
]
# Torch dtypes listed for this module; only half precision (float16) is present.
# NOTE(review): presumably consumed by the tests that iterate ALL_MODELS — confirm against the callers.
TORCH_DTYPES = [torch.float16]