Feat: Support Phi-3.5-MoE in SGLang (#7907)

This commit is contained in:
Binyao Jiang
2025-07-09 23:51:33 -07:00
committed by GitHub
parent b5e3d6031c
commit 2d54d4bb64
3 changed files with 560 additions and 1 deletion

View File

@@ -68,6 +68,12 @@ ALL_MODELS = [
ModelCase("microsoft/Phi-3-small-8k-instruct", trust_remote_code=True),
ModelCase("allenai/OLMo-2-1124-7B-Instruct", skip_long_prompt=True),
ModelCase("ibm-granite/granite-3.0-2b-instruct", skip_long_prompt=True),
ModelCase(
"microsoft/Phi-3.5-MoE-instruct",
tp_size=2,
trust_remote_code=True,
skip_long_prompt=True,
),
]
# Torch dtypes collected for this module; only float16 is listed.
# NOTE(review): presumably the dtypes the ALL_MODELS cases are run with — confirm against usage.
TORCH_DTYPES = [torch.float16]