{
"epoch": 2.0,
"eval_accuracy": 0.2550262872843518,
"eval_loss": 5.2102789878845215,
"eval_runtime": 10.0113,
"eval_samples": 37,
"eval_samples_per_second": 3.696,
"eval_steps_per_second": 1.898,
"perplexity": 183.14514634383818,
"total_flos": 4578913057505280.0,
"train_loss": 6.445547739664714,
"train_runtime": 1136.4366,
"train_samples": 767,
"train_samples_per_second": 1.35,
"train_steps_per_second": 0.169
}