forked from EngineX-Cambricon/enginex-mlu370-vllm
add deepseekv3
This commit is contained in:
@@ -565,7 +565,9 @@ def vllm__module_executor__models__deepseek_v2__DeepseekV2ForCausalLM__load_weig
|
||||
@brief: add an expert-skipped condition and delete the useless `if name not in params_dict: continue` condition
|
||||
'''
|
||||
name = name.replace(weight_name, param_name)
|
||||
if (("mlp.experts." in name or "mlp.shared_experts." in name or "mlp.shared_expert_gate." in name)
|
||||
if (("mlp.experts." in name or "mlp.shared_experts." in name
|
||||
or "mlp.shared_expert_gate." in name
|
||||
or "e_score_correction_bias" in name)
|
||||
and name not in params_dict):
|
||||
continue
|
||||
'''
|
||||
@@ -595,7 +597,9 @@ def vllm__module_executor__models__deepseek_v2__DeepseekV2ForCausalLM__load_weig
|
||||
if name.endswith(".bias") and name not in params_dict:
|
||||
continue
|
||||
|
||||
if (("mlp.experts." in name or "mlp.shared_experts." in name or "mlp.shared_expert_gate." in name)
|
||||
if (("mlp.experts." in name or "mlp.shared_experts." in name
|
||||
or "mlp.shared_expert_gate." in name
|
||||
or "e_score_correction_bias" in name)
|
||||
and name not in params_dict):
|
||||
continue
|
||||
if is_pp_missing_parameter(name, self):
|
||||
|
||||
Reference in New Issue
Block a user