{ "epoch": 3.0, "eval_loss": 2.030430555343628, "eval_runtime": 15.4256, "eval_samples": 1000, "eval_samples_per_second": 64.827, "eval_steps_per_second": 8.103, "perplexity": 7.617365350191575, "train_loss": 2.1000711460306185, "train_runtime": 3427.7755, "train_samples": 19004, "train_samples_per_second": 16.632, "train_steps_per_second": 0.26 }