{ "achieved_tflops_per_gpu": 0.003934338055156972, "achieved_tflops_per_gpu_theoretical": 464.14292510677404, "epoch": 7.0, "loss_nan_ranks": 0, "loss_rank_avg": 0.25985902547836304, "mfu_percent": 0.0002780450922372418, "mfu_percent_theoretical": 32.801620148888624, "total_flos": 2042313493250048.0, "train_loss": 0.3067965584114964, "train_runtime": 32443.7279, "train_samples_per_second": 2.185, "train_steps_per_second": 0.137, "valid_targets_mean": 4442.9, "valid_targets_min": 1017 }