qwen2.5-7b-idea-review-mvp-1 / all_results.json
sumuks's picture
End of training
5fa1c3d verified
raw
history blame contribute delete
379 Bytes
{
"epoch": 3.0,
"eval_loss": 1.2680052518844604,
"eval_runtime": 37.3047,
"eval_samples_per_second": 10.32,
"eval_steps_per_second": 2.6,
"perplexity": 3.553756638060757,
"total_flos": 234145141751808.0,
"train_loss": 1.2264163225196905,
"train_runtime": 4742.9935,
"train_samples_per_second": 24.104,
"train_steps_per_second": 0.753
}