{ | |
"epoch": 1.995634549423137, | |
"eval_accuracy": 0.3789325513196481, | |
"eval_loss": 4.358436584472656, | |
"eval_runtime": 20.603, | |
"eval_samples": 250, | |
"eval_samples_per_second": 12.134, | |
"eval_steps_per_second": 3.058, | |
"perplexity": 78.13488159488827, | |
"total_flos": 6.441101073108173e+16, | |
"train_loss": 8.280340445041656, | |
"train_runtime": 18888.2342, | |
"train_samples": 51310, | |
"train_samples_per_second": 5.433, | |
"train_steps_per_second": 0.042 | |
} |