16 lines
586 B
JSON
16 lines
586 B
JSON
{
|
|
"epoch": 0.9981298423724285,
|
|
"eval_logits/chosen": -1.3243151903152466,
|
|
"eval_logits/rejected": -1.3434444665908813,
|
|
"eval_logps/chosen": -726.5227661132812,
|
|
"eval_logps/rejected": -886.8052368164062,
|
|
"eval_loss": 0.3820632994174957,
|
|
"eval_rewards/accuracies": 0.8669354915618896,
|
|
"eval_rewards/chosen": -4.470167636871338,
|
|
"eval_rewards/margins": 1.6623308658599854,
|
|
"eval_rewards/rejected": -6.132497787475586,
|
|
"eval_runtime": 127.0737,
|
|
"eval_samples": 1961,
|
|
"eval_samples_per_second": 15.432,
|
|
"eval_steps_per_second": 0.488
|
|
} |