model: Support nvidia/Llama-3_1-Nemotron-Ultra-253B-v1 (#9301)
This commit is contained in:
@@ -83,6 +83,12 @@ ALL_MODELS = [
|
||||
trust_remote_code=True,
|
||||
skip_long_prompt=True,
|
||||
),
|
||||
ModelCase(
|
||||
"nvidia/Llama-3_1-Nemotron-Ultra-253B-v1",
|
||||
tp_size=8,
|
||||
trust_remote_code=True,
|
||||
skip_long_prompt=True,
|
||||
),
|
||||
]
|
||||
|
||||
TORCH_DTYPES = [torch.float16]
|
||||
|
||||
Reference in New Issue
Block a user