Files
ABEJA-Qwen3-14B-Agentic-256…/recipe.yml

13 lines
632 B
YAML
Raw Normal View History

# Merge recipe: three input model checkpoints, each with weight 1, combined
# into a single model written to `output_path`.
# NOTE(review): how the consuming tool combines the weighted inputs is not
# visible in this file; the output directory name suggests a "model soup"
# (weight averaging) -- confirm against the tool that reads this recipe.

device_map: cpu  # Only `auto`, `cpu`, or `cuda` are supported
dtype: bfloat16
# NOTE(review): presumably forwarded to the model loader, which would allow
# code shipped with the checkpoints to run -- use only with trusted inputs.
trust_remote_code: true
copy_tokenizer: true

# Each entry is one mapping holding both the checkpoint `path` and its
# `weight`; `weight` must be indented under its `path` to belong to the
# same list item.
input_models:
  - path: /data/models/hf/experiments/rl_egov_search/run_016_qwen3_egov_restart_from011s130_5e_7_gspo_step_30
    weight: 1
  - path: /data/models/hf/experiments/rl_wiki_search/run_047_qwen3_base043_250s_add_tool_desc_simple_step_60
    weight: 1
  - path: /data/models/hf/experiments/rl_wiki_deepresearch/run_023_qwen3_deepresearch_retrain_from_021s20_add_think_reward_step_150
    weight: 1

output_path: /data/models/hf/experiments/rl_model_soup/qwen3_soup_egov016_wiki047_deep023