Files
exp-syh-tezos-askllm-harden…/train_results.json

16 lines
544 B
JSON
Raw Normal View History

{
"achieved_tflops_per_gpu": 4.937536133249764,
"achieved_tflops_per_gpu_theoretical": 226.98960570915227,
"epoch": 7.0,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08761073648929596,
"mfu_percent": 0.4992453117542734,
"mfu_percent_theoretical": 22.951426259772727,
"total_flos": 2.474107676200534e+18,
"train_loss": 0.24594933182050951,
"train_runtime": 62635.179,
"train_samples_per_second": 1.069,
"train_steps_per_second": 0.067,
"valid_targets_mean": 11621.8,
"valid_targets_min": 3550
}