# File: llama-3-Nephilim-v3-8B/mergekit_config.yml
# Repository viewer listing: 14 lines, 363 B, YAML
# (viewer controls "Raw", "Normal View", "History" omitted)

# mergekit configuration: merges the listed source models onto `base_model`
# using the `task_arithmetic` merge method, with tensors handled as bfloat16.
base_model: grimjim/Llama-3-Instruct-8B-SPPO-Iter3-SimPO-merge
dtype: bfloat16
merge_method: task_arithmetic

# Global merge parameters (apply to the whole merge, not to a single source).
parameters:
  # Leave the per-model weights as written rather than rescaling them.
  normalize: false

# One slice whose sources all span the same [0, 32] layer range.
slices:
- sources:
  # Same model as `base_model`; no per-source parameters are given for it.
  - layer_range: [0, 32]
    model: grimjim/Llama-3-Instruct-8B-SPPO-Iter3-SimPO-merge
  # Model being merged in; `weight` is scoped to this source only.
  - layer_range: [0, 32]
    model: tokyotech-llm/Llama-3-Swallow-8B-Instruct-v0.1
    parameters:
      weight: 0.1