{ "epoch": 3.0, "total_flos": 4.271915416263066e+16, "train_loss": 0.3954192769085303, "train_runtime": 93126.1025, "train_samples_per_second": 70.83, "train_steps_per_second": 0.069 }