|
{ |
|
"epoch": 3.0, |
|
"eval_logits/chosen": -2.4403114318847656, |
|
"eval_logits/rejected": -2.160489320755005, |
|
"eval_logps/chosen": -84.75238800048828, |
|
"eval_logps/rejected": -121.9200210571289, |
|
"eval_loss": 0.009359963238239288, |
|
"eval_rewards/accuracies": 0.9916201233863831, |
|
"eval_rewards/chosen": -1.2833248376846313, |
|
"eval_rewards/margins": 28.446029663085938, |
|
"eval_rewards/rejected": -29.729354858398438, |
|
"eval_runtime": 194.4792, |
|
"eval_samples": 2862, |
|
"eval_samples_per_second": 14.716, |
|
"eval_steps_per_second": 0.92 |
|
} |