---
# Model-merge configuration `karcher_stock_12b_v1`.
#
# NOTE(review): this file was recovered from a flattened copy in which every
# line was separated by stray `|` markers and all indentation was lost. The
# nesting below (per-model `parameters`, method-level `parameters`,
# `tokenizer.source`) follows the usual mergekit-style layout; confirm against
# the tool that consumes this file.

architecture: MistralForCausalLM

# Local checkpoint used as the merge base. The trailing comment is the
# author's note, presumably naming the upstream model it derives from.
base_model: 'B:/12B/MuXodious--Mistral-Nemo-Instruct-2407-absolute-heresy'  # mistralai--Mistral-Nemo-Instruct-2407

# Models to merge; all three carry the same weight (1.0).
models:
  - model: 'B:/12B/EldritchLabs--MN-12B-RP-Ink-Longform-MPOA'
    parameters:
      weight: 1.0
  - model: 'B:/12B/EldritchLabs--Human-Like-Mistral-Nemo-Instruct-2407-MPOA'
    parameters:
      weight: 1.0
  - model: 'B:/12B/MuXodious-Rocinante-X-12B-v1-absolute-heresy'  # TheDrummer--Rocinante-X-12B-v1
    parameters:
      weight: 1.0

merge_method: karcher_stock  # v12B

# Options passed to the merge method. Names suggest iteration bounds and a
# convergence tolerance for an iterative solver; verify exact semantics in the
# merge method's documentation.
parameters:
  filter_wise: true
  max_iter: 25
  min_iter: 10
  tol: 1.0e-9
  magnitude_mean_geometric: false  # TRUE makes it 75% karcher

# Working dtype vs. dtype of the written output.
dtype: float32
out_dtype: bfloat16

tokenizer:
  source: union

chat_template: auto

name: karcher_stock_12b_v1