{ "epoch": 3.0, "eval_loss": 1.2680052518844604, "eval_runtime": 37.3047, "eval_samples_per_second": 10.32, "eval_steps_per_second": 2.6, "perplexity": 3.553756638060757, "total_flos": 234145141751808.0, "train_loss": 1.2264163225196905, "train_runtime": 4742.9935, "train_samples_per_second": 24.104, "train_steps_per_second": 0.753 }