m2m100_1.2B_ft_kbd-ru_63K / all_results.json
anzorq's picture
End of training
824dc30
raw
history blame
443 Bytes
{
"epoch": 2.27,
"predict_bleu": 25.5069,
"predict_gen_len": 9.3963,
"predict_loss": 1.5133029222488403,
"predict_runtime": 98.9855,
"predict_samples": 641,
"predict_samples_per_second": 6.476,
"predict_steps_per_second": 0.414,
"train_loss": 5.4469778463318936e-05,
"train_runtime": 1.6018,
"train_samples": 63407,
"train_samples_per_second": 89898.478,
"train_steps_per_second": 5618.655
}