gemma-2-Ifable-9B / all_results.json
linzaiyun's picture
Upload folder using huggingface_hub
eea2579 verified
{
"before_init_mem_cpu": 3802071040,
"before_init_mem_gpu": 22016,
"epoch": 0.9807355516637478,
"eval_logits/chosen": -12.004097938537598,
"eval_logits/rejected": -17.047502517700195,
"eval_logps/chosen": -2.168222427368164,
"eval_logps/rejected": -4.787535667419434,
"eval_loss": 1.0162526369094849,
"eval_mem_cpu_alloc_delta": 466944,
"eval_mem_cpu_peaked_delta": 0,
"eval_mem_gpu_alloc_delta": 0,
"eval_mem_gpu_peaked_delta": 25220711424,
"eval_rewards/accuracies": 0.9166666865348816,
"eval_rewards/chosen": -21.682226181030273,
"eval_rewards/margins": 26.193130493164062,
"eval_rewards/rejected": -47.875362396240234,
"eval_runtime": 9.9413,
"eval_samples_per_second": 9.456,
"eval_sft_loss": 0.01844729855656624,
"eval_steps_per_second": 1.207,
"init_mem_cpu_alloc_delta": 364544,
"init_mem_cpu_peaked_delta": 0,
"init_mem_gpu_alloc_delta": 0,
"init_mem_gpu_peaked_delta": 0,
"total_flos": 39867492466688.0,
"train_loss": 3.085822834287371,
"train_mem_cpu_alloc_delta": 5213659136,
"train_mem_cpu_peaked_delta": 22737326080,
"train_mem_gpu_alloc_delta": 16267848704,
"train_mem_gpu_peaked_delta": 36029468160,
"train_runtime": 1628.7465,
"train_samples_per_second": 2.805,
"train_steps_per_second": 0.021
}