{ "epoch": 50.53, "eval_loss": 2.259847640991211, "eval_runtime": 48.3465, "eval_samples": 40000, "eval_samples_per_second": 827.361, "eval_steps_per_second": 51.71, "perplexity": 9.58162920801955, "train_loss": 2.392315192057292, "train_runtime": 173434.012, "train_samples": 760001, "train_samples_per_second": 221.41, "train_steps_per_second": 13.838 }