{ "epoch": 2.87, "eval_loss": 8.360694885253906, "eval_runtime": 47.1861, "eval_samples": 8752, "eval_samples_per_second": 185.478, "eval_steps_per_second": 11.592, "perplexity": 4275.664830790565, "train_loss": 9.417760696411133, "train_runtime": 4915.0289, "train_samples": 142865, "train_samples_per_second": 83.336, "train_steps_per_second": 0.02 }