{ "epoch": 1.0, "eval_loss": 0.48741263151168823, "eval_runtime": 140.0059, "eval_samples_per_second": 2.693, "eval_steps_per_second": 0.679, "perplexity": 1.6280982754463373, "total_flos": 8.066906520991826e+17, "train_loss": 0.5547944433354423, "train_runtime": 22221.3478, "train_samples_per_second": 0.831, "train_steps_per_second": 0.052 }