qwen2-0.5b-sft / all_results.json
yinmingzhang's picture
End of training
ce6834c verified
raw
history blame contribute delete
419 Bytes
{
"epoch": 0.9993049349617714,
"eval_loss": 1.5326507091522217,
"eval_runtime": 223.1588,
"eval_samples": 23109,
"eval_samples_per_second": 119.843,
"eval_steps_per_second": 4.996,
"total_flos": 106161864966144.0,
"train_loss": 1.5477431688475496,
"train_runtime": 10888.6684,
"train_samples": 207864,
"train_samples_per_second": 22.196,
"train_steps_per_second": 0.116
}