{ "epoch": 1.0, "eval_abs_diff": 0.4453125, "eval_all_logps_1": -656.8973388671875, "eval_all_logps_1_values": -656.8973388671875, "eval_all_logps_2": 434.6329040527344, "eval_all_logps_2_values": 434.6329345703125, "eval_logits/chosen": 5.71875, "eval_logits/rejected": 5.6875, "eval_logps/chosen": -1.9453125, "eval_logps/rejected": -2.03125, "eval_loss": 1.7800946235656738, "eval_original_losses": 1.796875, "eval_rewards/accuracies": 0.4404762089252472, "eval_rewards/chosen": -4.875, "eval_rewards/margins": 0.2001953125, "eval_rewards/rejected": -5.0625, "eval_runtime": 7.6194, "eval_samples": 1961, "eval_samples_per_second": 257.37, "eval_steps_per_second": 0.919, "eval_weight": 1.0 }