{ "arm": "think_phase3_rlmt", "config": "configs/generated/phase4b_sft_think_phase3.yaml", "checkpoint": "outputs/phase4b_rlmt_think_phase3/final.pt", "dtype": "bfloat16" }