Files
a1-wizardlm_orca/train_results.json

16 lines
544 B
JSON
Raw Permalink Normal View History

{
"achieved_tflops_per_gpu": 0.0028883878665412407,
"achieved_tflops_per_gpu_theoretical": 985.8802277815419,
"epoch": 7.0,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25369924306869507,
"mfu_percent": 0.00020412635099231386,
"mfu_percent_theoretical": 69.67351433085102,
"total_flos": 644683152949248.0,
"train_loss": 0.3271850697072269,
"train_runtime": 13949.8914,
"train_samples_per_second": 4.655,
"train_steps_per_second": 0.291,
"valid_targets_mean": 2212.8,
"valid_targets_min": 431
}