{ | |
"epoch": 35.0, | |
"eval_accuracy": 0.5302221081011683, | |
"eval_loss": 2.9193999767303467, | |
"eval_runtime": 31.3487, | |
"eval_samples": 4053, | |
"eval_samples_per_second": 129.287, | |
"eval_steps_per_second": 32.346, | |
"perplexity": 18.530165592844845, | |
"total_flos": 1.8479030675124096e+17, | |
"train_loss": 0.37831091759340585, | |
"train_runtime": 6392.496, | |
"train_samples": 80219, | |
"train_samples_per_second": 439.213, | |
"train_steps_per_second": 27.453 | |
} |