Goedel-Prover-DPO / eval_results.json
linyongver's picture
Upload folder using huggingface_hub
efd7552 verified
{
"epoch": 1.998667732480682,
"eval_logits/chosen": -13.45787239074707,
"eval_logits/rejected": -12.986124992370605,
"eval_logps/chosen": -209.70858764648438,
"eval_logps/rejected": -266.514404296875,
"eval_loss": 0.535685658454895,
"eval_rewards/accuracies": 0.7565789818763733,
"eval_rewards/chosen": -4.100185394287109,
"eval_rewards/margins": 1.7237099409103394,
"eval_rewards/rejected": -5.823895454406738,
"eval_runtime": 15.7482,
"eval_samples_per_second": 19.304,
"eval_steps_per_second": 2.413
}