{
    "epoch": 9.885931558935361,
    "eval_accuracy": 0.36815393801226726,
    "eval_loss": 3.1956684589385986,
    "eval_runtime": 1.526,
    "eval_samples": 18,
    "eval_samples_per_second": 11.796,
    "eval_steps_per_second": 1.966,
    "perplexity": 24.42649634599656,
    "total_flos": 5425467752448000.0,
    "train_loss": 2.6658438814603365,
    "train_runtime": 1438.1403,
    "train_samples": 525,
    "train_samples_per_second": 3.651,
    "train_steps_per_second": 0.452
}