# File: super-model-7b/mergekit_config.yml
# 19 lines, 363 B, YAML

# mergekit configuration: combines three 7B model checkpoints using the
# dare_ties merge method, with Qwen/Qwen2.5-7B-Instruct as the base model.
models:
  # NOTE(review): this entry is the same checkpoint as base_model below;
  # confirm whether dare_ties actually applies a weight to the base model.
  - model: Qwen/Qwen2.5-7B-Instruct
    parameters:
      weight: 0.3
  - model: Qwen/Qwen2.5-Coder-7B-Instruct
    parameters:
      weight: 0.4
  - model: deepseek-ai/DeepSeek-R1-Distill-Qwen-7B
    parameters:
      weight: 0.3
merge_method: dare_ties
base_model: Qwen/Qwen2.5-7B-Instruct
# Top-level parameters: not attached to any single model entry above.
parameters:
  density: 0.8
  normalize: true
dtype: bfloat16