{ "achieved_tflops_per_gpu": 0.005310423151959063, "achieved_tflops_per_gpu_theoretical": 704.6841490672189, "epoch": 7.0, "loss_nan_ranks": 0, "loss_rank_avg": 0.21552443504333496, "mfu_percent": 0.00037529492239993375, "mfu_percent_theoretical": 49.800999934079066, "total_flos": 1717709353779200.0, "train_loss": 0.15650485047922919, "train_runtime": 20216.2486, "train_samples_per_second": 3.333, "train_steps_per_second": 0.208, "valid_targets_mean": 5110.8, "valid_targets_min": 529 }