{ | |
"epoch": 3.0, | |
"eval_loss": 2.030430555343628, | |
"eval_runtime": 15.4256, | |
"eval_samples": 1000, | |
"eval_samples_per_second": 64.827, | |
"eval_steps_per_second": 8.103, | |
"perplexity": 7.617365350191575, | |
"train_loss": 2.1000711460306185, | |
"train_runtime": 3427.7755, | |
"train_samples": 19004, | |
"train_samples_per_second": 16.632, | |
"train_steps_per_second": 0.26 | |
} |