---
# Model-merge configuration: combines two Llama3-8B Chinese checkpoints with
# the `slerp` merge method, using the Chinese-Chat checkpoint as base model.
# NOTE(review): key layout matches a mergekit config — confirm the consumer.

# A single slice drawing layers 0-32 from both source models.
slices:
  - sources:
      - model: shanchen/llama3-8B-slerp-med-chinese
        layer_range: [0, 32]
      - model: shenzhi-wang/Llama3-8B-Chinese-Chat
        layer_range: [0, 32]

merge_method: slerp
base_model: shenzhi-wang/Llama3-8B-Chinese-Chat

parameters:
  # Interpolation factor `t`, given per tensor-name filter. The two lists
  # mirror each other (self_attn rises 0.3 -> 1, mlp falls 1 -> 0.3).
  # NOTE(review): presumably each list is a gradient spread across the layer
  # range, and t=0 selects base_model — verify against the merge tool's docs.
  t:
    - filter: self_attn
      value: [0.3, 0.5, 0.5, 0.7, 1]
    - filter: mlp
      value: [1, 0.7, 0.5, 0.5, 0.3]
    # Entry with no filter: applies 0.5 (presumably to all remaining tensors).
    - value: 0.5

dtype: bfloat16