{ "epoch": 20.0, "eval_accuracy": 0.1432211125795332, "eval_loss": 6.276556968688965, "eval_runtime": 5.1628, "eval_samples": 963, "eval_samples_per_second": 186.528, "eval_steps_per_second": 11.815, "perplexity": 531.9539730039461, "total_flos": 1.513744687742976e+16, "train_loss": 3.172654545207319, "train_runtime": 2061.7586, "train_samples": 19092, "train_samples_per_second": 185.201, "train_steps_per_second": 5.791 }