yakazimir's picture
End of training
193f4bd verified
raw
history blame contribute delete
785 Bytes
{
"epoch": 1.9978142076502732,
"eval_logits/chosen": -1.4140465259552002,
"eval_logits/rejected": -1.3327398300170898,
"eval_logps/chosen": -0.8071117401123047,
"eval_logps/rejected": -1.9723843336105347,
"eval_loss": 1.2685352563858032,
"eval_rewards/accuracies": 0.8674699068069458,
"eval_rewards/chosen": -8.071117401123047,
"eval_rewards/margins": 11.652724266052246,
"eval_rewards/rejected": -19.723840713500977,
"eval_runtime": 33.7378,
"eval_samples": 1318,
"eval_samples_per_second": 39.066,
"eval_steps_per_second": 2.46,
"total_flos": 0.0,
"train_loss": 1.4686054226084402,
"train_runtime": 12099.7941,
"train_samples": 58558,
"train_samples_per_second": 9.679,
"train_steps_per_second": 0.076
}