# File: ChimeraLlama-3-8B-v3/mergekit_config.yml
# (38 lines, 931 B, YAML)

# Models taking part in the merge. The first entry is the base model; every
# other entry carries its own `density` and `weight` under `parameters`.
# The listed weights (0.5 + 0.05 + 0.05 + 0.2 + 0.1 + 0.05 + 0.05) sum to 1.0.
# NOTE(review): exact semantics of `density`/`weight` are defined by the
# merge tool for the chosen merge method; confirm against its documentation.
models:
  - model: NousResearch/Meta-Llama-3-8B
    # No parameters necessary for base model
  - model: NousResearch/Meta-Llama-3-8B-Instruct
    parameters:
      density: 0.6
      weight: 0.5
  - model: mlabonne/OrpoLlama-3-8B
    parameters:
      density: 0.55
      weight: 0.05
  - model: cognitivecomputations/dolphin-2.9-llama3-8b
    parameters:
      density: 0.55
      weight: 0.05
  - model: Danielbrdz/Barcenas-Llama3-8b-ORPO
    parameters:
      density: 0.55
      weight: 0.2
  - model: VAGOsolutions/Llama-3-SauerkrautLM-8b-Instruct
    parameters:
      density: 0.55
      weight: 0.1
  - model: vicgalle/Configurable-Llama-3-8B-v0.3
    parameters:
      density: 0.55
      weight: 0.05
  - model: MaziyarPanahi/Llama-3-8B-Instruct-DPO-v0.3
    parameters:
      density: 0.55
      weight: 0.05
# Merge-wide settings: the merge method, the base model (the same repository
# as the first entry of `models`), global parameters, and the output dtype.
merge_method: dare_ties
base_model: NousResearch/Meta-Llama-3-8B
# `int8_mask` must be nested under `parameters`; left at column 0 it would
# become a separate top-level key and `parameters` would be null.
parameters:
  int8_mask: true
dtype: float16