{ "achieved_tflops_per_gpu": 0.004033428420429949, "achieved_tflops_per_gpu_theoretical": 467.53082966959727, "epoch": 7.0, "loss_nan_ranks": 0, "loss_rank_avg": 0.20417048037052155, "mfu_percent": 0.0002850479449067102, "mfu_percent_theoretical": 33.04104803318709, "total_flos": 1952534555328512.0, "train_loss": 0.3077526548922005, "train_runtime": 30255.504, "train_samples_per_second": 2.205, "train_steps_per_second": 0.138, "valid_targets_mean": 6589.3, "valid_targets_min": 3933 }