model: Support nvidia/Llama-3_1-Nemotron-Ultra-253B-v1 (#9301)

2025-08-26 10:33:40 +03:00
parent f92b729d52
commit 4cd08dc592
2 changed files with 7 additions and 0 deletions
--- a/test/srt/models/test_generation_models.py
+++ b/test/srt/models/test_generation_models.py
@@ -83,6 +83,12 @@ ALL_MODELS = [
        trust_remote_code=True,
        skip_long_prompt=True,
    ),
+    ModelCase(
+        "nvidia/Llama-3_1-Nemotron-Ultra-253B-v1",
+        tp_size=8,
+        trust_remote_code=True,
+        skip_long_prompt=True,
+    ),
 ]

 TORCH_DTYPES = [torch.float16]