{ "epoch": 2.54, "eval_accuracy": 0.46849419452203217, "eval_loss": 3.0123162269592285, "eval_runtime": 1485.7627, "eval_samples": 308356, "eval_samples_per_second": 207.541, "eval_steps_per_second": 3.243, "perplexity": 20.334444609931378, "train_loss": 4.630338809797302, "train_runtime": 197999.0445, "train_samples": 5858758, "train_samples_per_second": 2958.983, "train_steps_per_second": 46.235 }