初始化项目,由ModelHub XC社区提供模型
Model: abeja/ABEJA-Qwen3-14B-Agentic-256k-v0.1 Source: Original Platform
This commit is contained in:
12
recipe.yml
Normal file
12
recipe.yml
Normal file
@@ -0,0 +1,12 @@
---
# Recipe that combines several RL-trained checkpoints into one output model.
# NOTE(review): the output directory name ("rl_model_soup") suggests a
# model-soup style weight merge; confirm against the tool that reads this file.

device_map: cpu  # Only `auto`, `cpu`, or `cuda` are supported
dtype: bfloat16
# NOTE(review): presumably forwarded to the model loader, which would allow
# checkpoint-supplied code to run; confirm every input path is trusted.
trust_remote_code: true
copy_tokenizer: true

# Checkpoints to combine. Every entry carries the same weight (1).
# Each `weight` belongs to the `path` entry directly above it, so it must be
# indented inside that list item rather than placed at the top level.
input_models:
  - path: /data/models/hf/experiments/rl_egov_search/run_016_qwen3_egov_restart_from011s130_5e_7_gspo_step_30
    weight: 1
  - path: /data/models/hf/experiments/rl_wiki_search/run_047_qwen3_base043_250s_add_tool_desc_simple_step_60
    weight: 1
  - path: /data/models/hf/experiments/rl_wiki_deepresearch/run_023_qwen3_deepresearch_retrain_from_021s20_add_think_reward_step_150
    weight: 1

# Destination directory for the combined model.
output_path: /data/models/hf/experiments/rl_model_soup/qwen3_soup_egov016_wiki047_deep023
Reference in New Issue
Block a user