{ "achieved_tflops_per_gpu": 4.887838957353747, "achieved_tflops_per_gpu_theoretical": 267.64446046303027, "epoch": 7.0, "loss_nan_ranks": 0, "loss_rank_avg": 0.2101859748363495, "mfu_percent": 0.4942203192470927, "mfu_percent_theoretical": 27.062129470478286, "total_flos": 2.402936079087829e+18, "train_loss": 0.2685813971707974, "train_runtime": 61451.9039, "train_samples_per_second": 1.267, "train_steps_per_second": 0.079, "valid_targets_mean": 2883.4, "valid_targets_min": 615 }