add deepseekv3
This commit is contained in:
@@ -565,7 +565,9 @@ def vllm__module_executor__models__deepseek_v2__DeepseekV2ForCausalLM__load_weig
|
|||||||
@brief: add expert skipped condition and delete the useless `if name not in params_dict: continue` condition
|
@brief: add expert skipped condition and delete the useless `if name not in params_dict: continue` condition
|
||||||
'''
|
'''
|
||||||
name = name.replace(weight_name, param_name)
|
name = name.replace(weight_name, param_name)
|
||||||
if (("mlp.experts." in name or "mlp.shared_experts." in name or "mlp.shared_expert_gate." in name)
|
if (("mlp.experts." in name or "mlp.shared_experts." in name
|
||||||
|
or "mlp.shared_expert_gate." in name
|
||||||
|
or "e_score_correction_bias" in name)
|
||||||
and name not in params_dict):
|
and name not in params_dict):
|
||||||
continue
|
continue
|
||||||
'''
|
'''
|
||||||
@@ -595,7 +597,9 @@ def vllm__module_executor__models__deepseek_v2__DeepseekV2ForCausalLM__load_weig
|
|||||||
if name.endswith(".bias") and name not in params_dict:
|
if name.endswith(".bias") and name not in params_dict:
|
||||||
continue
|
continue
|
||||||
|
|
||||||
if (("mlp.experts." in name or "mlp.shared_experts." in name or "mlp.shared_expert_gate." in name)
|
if (("mlp.experts." in name or "mlp.shared_experts." in name
|
||||||
|
or "mlp.shared_expert_gate." in name
|
||||||
|
or "e_score_correction_bias" in name)
|
||||||
and name not in params_dict):
|
and name not in params_dict):
|
||||||
continue
|
continue
|
||||||
if is_pp_missing_parameter(name, self):
|
if is_pp_missing_parameter(name, self):
|
||||||
|
|||||||
Reference in New Issue
Block a user