Support LingV2 model (#10359)

Co-authored-by: 羽癫 <yudian.zy@antgroup.com>
Co-authored-by: guoyuhong <yuhong.gyh@antgroup.com>
This commit is contained in:
strgrb
2025-09-12 14:53:52 +08:00
committed by GitHub
parent b3839a7f99
commit fac07c9b08
7 changed files with 1189 additions and 245 deletions

View File

@@ -754,7 +754,12 @@ class ServerArgs:
)
model_arch = self.get_hf_config().architectures[0]
if model_arch in ["DeepseekV3ForCausalLM", "Glm4MoeForCausalLM"]:
if model_arch in [
"DeepseekV3ForCausalLM",
"Glm4MoeForCausalLM",
"BailingMoeForCausalLM",
"BailingMoeV2ForCausalLM",
]:
# Auto set draft_model_path DeepSeek-V3/R1
if self.speculative_draft_model_path is None:
self.speculative_draft_model_path = self.model_path
@@ -2724,6 +2729,8 @@ def auto_choose_speculative_params(self: ServerArgs):
"DeepseekV3ForCausalLM",
"DeepseekV2ForCausalLM",
"GptOssForCausalLM",
"BailingMoeForCausalLM",
"BailingMoeV2ForCausalLM",
]:
# The default value for deepseek and gpt-oss
return (3, 1, 4)