# YAML merge configuration (file-viewer listing reported: 21 lines, 480 B)
# Merge configuration: combines two fine-tuned Qwen2.5-7B variants on top of
# the Qwen2.5-7B-Instruct base using the `breadcrumbs` merge method.
# NOTE(review): the nesting below was reconstructed from a listing whose
# indentation had been stripped; keys and values are unchanged.

# Reference model; it also appears as the last entry in `sources` below.
base_model: Qwen/Qwen2.5-7B-Instruct
# Data type named for the merge.
dtype: float16
merge_method: breadcrumbs
modules:
  default:
    slices:
    - sources:
      # Every source uses the same layer_range, [0, 28].
      - layer_range: [0, 28]
        model: Alelcv27/Qwen2.5-7B-Math-CoT
        parameters:
          weight: 0.8
      - layer_range: [0, 28]
        model: Alelcv27/Qwen2.5-7B-Code-v2
        parameters:
          weight: 0.8
      # Base model entry: no per-source parameters are given for it.
      - layer_range: [0, 28]
        model: Qwen/Qwen2.5-7B-Instruct
# NOTE(review): placed at top level as method-wide parameters (the listing had
# no indentation to prove this) — confirm against the original file.
# Presumably density/gamma are the breadcrumbs sparsification settings; see the
# mergekit merge-method documentation for their exact meaning.
parameters:
  density: 0.9
  gamma: 0.01
  normalize: 1.0