# Model-merge configuration (keys match the mergekit config schema).
#
# NOTE(review): this file was recovered from a rendering that had lost all
# indentation and contained stray "|" lines. The nesting below is
# reconstructed from key order and the mergekit schema -- confirm against
# the original file before relying on it.

# Model that the other source is merged relative to.
base_model: grimjim/Llama-3-Instruct-8B-SPPO-Iter3-SimPO-merge
dtype: bfloat16
merge_method: task_arithmetic

# Global merge parameters.
parameters:
  normalize: false

slices:
  - sources:
      # Same model as base_model, over layers [0, 32].
      - layer_range: [0, 32]
        model: grimjim/Llama-3-Instruct-8B-SPPO-Iter3-SimPO-merge
      # Second source over the same layer range.
      - layer_range: [0, 32]
        model: tokyotech-llm/Llama-3-Swallow-8B-Instruct-v0.1
        # Presumably the per-model weight for this source only -- TODO
        # confirm it belongs here and not at slice or top level.
        parameters:
          weight: 0.1