# Source listing metadata: 41 lines, 1.0 KiB, YAML
# mergekit configuration: DARE-TIES merge of three Sakura-SOLAR variants.
#
# Each entry under `models` carries its own `density` and `weight`.
# A list value (e.g. [0.33, 0.4, 0.33]) is a gradient rather than a single
# scalar; see the mergekit documentation for how it is interpolated.
models:
  # This model is also the `base_model` below.
  # NOTE(review): mergekit examples usually list the base model without
  # parameters -- confirm density/weight of 1.0 here is intentional.
  - model: kyujinpy/Sakura-SOLAR-Instruct
    parameters:
      density: 1.0
      weight: 1.0
  - model: kyujinpy/Sakura-SOLRCA-Math-Instruct-DPO-v2
    parameters:
      density: 0.5
      weight: [0.33, 0.4, 0.33]
  - model: kyujinpy/Sakura-SOLRCA-Instruct-DPO
    parameters:
      density: [0.33, 0.45, 0.66]
      weight: 0.66

merge_method: dare_ties
base_model: kyujinpy/Sakura-SOLAR-Instruct

# Global merge parameters (apply to the whole merge, not to a single model).
parameters:
  normalize: true
  int8_mask: true

dtype: bfloat16
tokenizer_source: union

# Alternative SLERP configuration, kept for reference (disabled).
#slices:
#  - sources:
#      - model: upstage/SOLAR-10.7B-Instruct-v1.0
#        layer_range: [0, 48]
#      - model: beomi/OPEN-SOLAR-KO-10.7B
#        layer_range: [0, 48]
## or, the equivalent `models:` syntax:
## models:
##   - model: psmathur/orca_mini_v3_13b
##   - model: garage-bAInd/Platypus2-13B
#merge_method: slerp
#base_model: upstage/SOLAR-10.7B-Instruct-v1.0
#parameters:
#  t:
#    - filter: self_attn
#      value: [0, 0.5, 0.3, 0.7, 1]
#    - filter: mlp
#      value: [1, 0.5, 0.7, 0.3, 0]
#    - value: 0.5  # fallback for rest of tensors
#dtype: float16