26 lines
933 B
JSON
26 lines
933 B
JSON
|
|
{
|
||
|
|
"model_name": "Qwen/Qwen2.5-0.5B-Instruct",
|
||
|
|
"condition": "single_m",
|
||
|
|
"participant_info": "/tmp/brainrl-data/configs/participant_run_info.json",
|
||
|
|
"train_subjects": "sub-01:sub-20",
|
||
|
|
"test_subjects": "sub-21:sub-26",
|
||
|
|
"exclude_subjects": "sub-03,sub-18",
|
||
|
|
"seed": 42,
|
||
|
|
"max_steps": 600,
|
||
|
|
"num_prompts": 128,
|
||
|
|
"train_prompt_top_k": 16,
|
||
|
|
"per_device_train_batch_size": 8,
|
||
|
|
"num_generations": 8,
|
||
|
|
"reward_delta_scale": 5.0,
|
||
|
|
"duplicate_action_penalty": 0.1,
|
||
|
|
"data_repo": "Mohith202/brainrl-config-data",
|
||
|
|
"data_revision": "main",
|
||
|
|
"env_url": null,
|
||
|
|
"config_dir": "/tmp/brainrl-data/configs",
|
||
|
|
"parcel_manifest": "/tmp/brainrl-data/configs/parcel_candidates.json",
|
||
|
|
"parcel_manifest_sha256": "d68a07e049750636e52727ed23cfc717500835ec2cc301102e29163495bbe77b",
|
||
|
|
"sequential_state_fraction": 0.5,
|
||
|
|
"sequential_state_min_prefix": 1,
|
||
|
|
"sequential_state_max_prefix": 10,
|
||
|
|
"sequential_state_exploration_eps": 0.25
|
||
|
|
}
|