{ "epoch": 2.0, "total_flos": 2.85249316814848e+16, "train_loss": 0.8500257841618516, "train_runtime": 594460.0391, "train_samples": 4779894, "train_samples_per_second": 3.624, "train_steps_per_second": 0.028 }