{ "epoch": 79.0, "learning_rate": 1.0000000000000002e-06, "total_flos": 8.188406191467658e+19, "train_loss": 0.4591466036709872, "train_runtime": 19731.8487, "train_samples_per_second": 53.236, "train_steps_per_second": 0.836 }