{ "epoch": 0.4, "eval_loss": 1.0858668088912964, "eval_runtime": 2658.3456, "eval_samples": 5000, "eval_samples_per_second": 9.435, "eval_steps_per_second": 4.718, "perplexity": 2.9620061996078197, "train_loss": 1.1317986328125, "train_runtime": 62833.7719, "train_samples": 100000, "train_samples_per_second": 3.183, "train_steps_per_second": 0.398 }