---
# Configuration combining three input model checkpoints (each with weight 1)
# into a single output checkpoint.
# NOTE(review): presumably consumed by a model-merging ("model soup") script,
# judging by the output directory name — confirm against the consuming tool.

# Only `auto`, `cpu`, or `cuda` are supported
device_map: cpu
dtype: bfloat16
trust_remote_code: true
copy_tokenizer: true

# Checkpoints to combine; every entry currently carries the same weight.
input_models:
  - path: /data/models/hf/experiments/rl_egov_search/run_016_qwen3_egov_restart_from011s130_5e_7_gspo_step_30
    weight: 1
  - path: /data/models/hf/experiments/rl_wiki_search/run_047_qwen3_base043_250s_add_tool_desc_simple_step_60
    weight: 1
  - path: /data/models/hf/experiments/rl_wiki_deepresearch/run_023_qwen3_deepresearch_retrain_from_021s20_add_think_reward_step_150
    weight: 1

# Destination of the combined checkpoint.
output_path: /data/models/hf/experiments/rl_model_soup/qwen3_soup_egov016_wiki047_deep023