Files
qwen3-8b-base-beta-dpo-hh-h…/all_results.json
ModelHub XC 527c912d5f 初始化项目,由ModelHub XC社区提供模型
Model: jackf857/qwen3-8b-base-beta-dpo-hh-harmless-4xh200-batch-64-20260424-025105
Source: Original Platform
2026-05-16 07:03:57 +08:00

21 lines
739 B
JSON

{
"epoch": 0.999244142101285,
"eval_beta_dpo/beta_used": 0.1372366100549698,
"eval_beta_dpo/beta_used_raw": 0.10684214532375336,
"eval_beta_dpo/gap_mean": 11.190993309020996,
"eval_beta_dpo/gap_std": 18.76331901550293,
"eval_beta_dpo/mask_keep_frac": 1.0,
"eval_logits/chosen": 1.3944156169891357,
"eval_logits/rejected": 1.2692357301712036,
"eval_loss": 0.6537412405014038,
"eval_runtime": 42.4848,
"eval_samples": 2303,
"eval_samples_per_second": 54.208,
"eval_steps_per_second": 1.695,
"total_flos": 0.0,
"train_loss": 1.1663504292943294,
"train_runtime": 3087.1314,
"train_samples": 42336,
"train_samples_per_second": 13.714,
"train_steps_per_second": 0.214
}