Model: jackf857/llama-3-8b-base-slic-hf-ultrafeedback-4xh200-batch-128-20260428-054623 Source: Original Platform
24 lines
878 B
JSON
24 lines
878 B
JSON
{
|
|
"epoch": 0.9989528795811519,
|
|
"eval_logits/chosen": -0.6059221029281616,
|
|
"eval_logits/rejected": -0.612111508846283,
|
|
"eval_logps/chosen": -260.80767822265625,
|
|
"eval_logps/rejected": -247.20326232910156,
|
|
"eval_loss": 341.7586364746094,
|
|
"eval_rewards/accuracies": 0.49399998784065247,
|
|
"eval_rewards/chosen": -260.80767822265625,
|
|
"eval_rewards/margins": -13.604412078857422,
|
|
"eval_rewards/rejected": -247.20326232910156,
|
|
"eval_runtime": 42.3358,
|
|
"eval_samples": 2000,
|
|
"eval_samples_per_second": 47.241,
|
|
"eval_slic/ce_loss": 260.80767822265625,
|
|
"eval_slic/rank_loss": 80.95094299316406,
|
|
"eval_steps_per_second": 2.953,
|
|
"total_flos": 0.0,
|
|
"train_loss": 2803.1413415552934,
|
|
"train_runtime": 5510.6328,
|
|
"train_samples": 61135,
|
|
"train_samples_per_second": 11.094,
|
|
"train_steps_per_second": 0.087
|
|
} |