{
    "epoch": 30.0,
    "eval_accuracy": 0.5187187058672487,
    "eval_loss": 2.996563196182251,
    "eval_runtime": 30.3359,
    "eval_samples": 4053,
    "eval_samples_per_second": 133.604,
    "eval_steps_per_second": 33.426,
    "perplexity": 20.01662535880206,
    "total_flos": 1.5839169150106368e+17,
    "train_loss": 0.47119966579742084,
    "train_runtime": 6930.0607,
    "train_samples": 80219,
    "train_samples_per_second": 347.265,
    "train_steps_per_second": 21.705
}