# File: qwen-2.5-7B-Resta-lr3e-5-sc…/mergekit_config.yml
# (22 lines, 430 B, YAML)

# mergekit merge configuration.
#
# Combines three checkpoints with merge_method `linear`, using the same
# layer_range ([0, 28]) for every source. The per-source weights sum to 1.0
# and are algebraically equal to:
#   1.0 * SSFT-gsm8k  +  0.5 * (SSFT - Qwen2.5-7B)
# NOTE(review): presumably the intent is to add half of the
# "SSFT minus base" delta onto the gsm8k fine-tune — confirm with the author.
# NOTE(review): the negative weight is deliberate in that reading; because the
# weights already sum to 1.0, weight normalization should not change the
# result — verify against the mergekit version in use.
dtype: float16
merge_method: linear
slices:
- sources:
  # Task fine-tune, taken at full weight.
  - layer_range: [0, 28]
    model:
      model:
        path: wvnvwn/qwen-2.5-7B-SSFT-gsm8k-lr3e-5
    parameters:
      weight: 1.0
  # Added at +0.5 ...
  - layer_range: [0, 28]
    model:
      model:
        path: wvnvwn/qwen-2.5-7B-SSFT-lr3e-5
    parameters:
      weight: 0.5
  # ... and the base model subtracted at -0.5.
  - layer_range: [0, 28]
    model:
      model:
        path: Qwen/Qwen2.5-7B
    parameters:
      weight: -0.5