{
  "epoch": 19.990992729846234,
  "eval_accuracy": 0.43054403912594785,
  "eval_loss": 2.910346746444702,
  "eval_runtime": 112.5282,
  "eval_samples": 52440,
  "eval_samples_per_second": 466.016,
  "eval_steps_per_second": 7.287,
  "perplexity": 18.36316482533208,
  "total_flos": 1.298988775636992e+18,
  "train_loss": 3.0016495520987547,
  "train_runtime": 41094.0958,
  "train_samples": 497364,
  "train_samples_per_second": 242.061,
  "train_steps_per_second": 0.945
}