{
  "epoch": 6.74,
  "eval_loss": 2.2311766147613525,
  "eval_runtime": 346.8001,
  "eval_samples": 299980,
  "eval_samples_per_second": 864.994,
  "eval_steps_per_second": 54.063,
  "perplexity": 9.310814879187836,
  "train_loss": 2.443978935546875,
  "train_runtime": 257950.5102,
  "train_samples": 5699618,
  "train_samples_per_second": 148.866,
  "train_steps_per_second": 9.304
}