{ | |
"epoch": 24.0, | |
"eval_accuracy": 0.4202126468521879, | |
"eval_loss": 2.989222764968872, | |
"eval_runtime": 111.6132, | |
"eval_samples": 52190, | |
"eval_samples_per_second": 467.597, | |
"eval_steps_per_second": 7.311, | |
"perplexity": 19.870232647372227, | |
"total_flos": 1.550560221462528e+18, | |
"train_loss": 3.0875192876465034, | |
"train_runtime": 49059.1729, | |
"train_samples": 494517, | |
"train_samples_per_second": 403.2, | |
"train_steps_per_second": 1.574 | |
} |