Support LingV2 model (#10359)
Co-authored-by: 羽癫 <yudian.zy@antgroup.com> Co-authored-by: guoyuhong <yuhong.gyh@antgroup.com>
This commit is contained in:
@@ -754,7 +754,12 @@ class ServerArgs:
|
||||
)
|
||||
|
||||
model_arch = self.get_hf_config().architectures[0]
|
||||
if model_arch in ["DeepseekV3ForCausalLM", "Glm4MoeForCausalLM"]:
|
||||
if model_arch in [
|
||||
"DeepseekV3ForCausalLM",
|
||||
"Glm4MoeForCausalLM",
|
||||
"BailingMoeForCausalLM",
|
||||
"BailingMoeV2ForCausalLM",
|
||||
]:
|
||||
# Auto-set draft_model_path to the target model path for the architectures listed above (DeepSeek-V3/R1, GLM-4 MoE, Bailing MoE)
|
||||
if self.speculative_draft_model_path is None:
|
||||
self.speculative_draft_model_path = self.model_path
|
||||
@@ -2724,6 +2729,8 @@ def auto_choose_speculative_params(self: ServerArgs):
|
||||
"DeepseekV3ForCausalLM",
|
||||
"DeepseekV2ForCausalLM",
|
||||
"GptOssForCausalLM",
|
||||
"BailingMoeForCausalLM",
|
||||
"BailingMoeV2ForCausalLM",
|
||||
]:
|
||||
# The default values for the DeepSeek, GPT-OSS, and Bailing MoE architectures listed above
|
||||
return (3, 1, 4)
|
||||
|
||||
Reference in New Issue
Block a user