Model: Support Qwen 72B RM model. (#3772)
This commit is contained in:
@@ -379,6 +379,8 @@ class Qwen2ForCausalLM(nn.Module):
|
||||
continue
|
||||
if name.startswith("model.vision_tower") and name not in params_dict:
|
||||
continue
|
||||
if name.startswith("lm_head"):
|
||||
continue
|
||||
|
||||
for param_name, weight_name, shard_id in stacked_params_mapping:
|
||||
if weight_name not in name:
|
||||
|
||||
Reference in New Issue
Block a user