smolm-mlm-bpe-unmask-seed_222 / all_results.json
kanishka's picture
End of training
0962286
raw
history blame contribute delete
447 Bytes
{
"epoch": 10.0,
"eval_accuracy": 0.44805263716438504,
"eval_loss": 2.700531244277954,
"eval_runtime": 8.6873,
"eval_samples": 70000,
"eval_samples_per_second": 8057.703,
"eval_steps_per_second": 15.77,
"perplexity": 14.887638597263566,
"train_loss": 3.087518670990711,
"train_runtime": 7284.0934,
"train_samples": 763989,
"train_samples_per_second": 1048.846,
"train_steps_per_second": 16.389
}