{ "achieved_tflops_per_gpu": 0.003467667592250595, "achieved_tflops_per_gpu_theoretical": 386.2211201618412, "epoch": 7.0, "loss_nan_ranks": 0, "loss_rank_avg": 0.3168274760246277, "mfu_percent": 0.000245064847508876, "mfu_percent_theoretical": 27.294778810024116, "total_flos": 1987075207921664.0, "train_loss": 0.31482745524102407, "train_runtime": 35814.3326, "train_samples_per_second": 1.821, "train_steps_per_second": 0.114, "valid_targets_mean": 9725.1, "valid_targets_min": 6847 }