{ "before_init_mem_cpu": 1261252608, "before_init_mem_gpu": 0, "epoch": 3.0, "init_mem_cpu_alloc_delta": 835670016, "init_mem_cpu_peaked_delta": 91971584, "init_mem_gpu_alloc_delta": 443396608, "init_mem_gpu_peaked_delta": 0, "train_loss": 1.5746790189531785, "train_mem_cpu_alloc_delta": 1865678848, "train_mem_cpu_peaked_delta": 333721600, "train_mem_gpu_alloc_delta": 1350910464, "train_mem_gpu_peaked_delta": 21529119744, "train_runtime": 8836.9123, "train_samples": 3234398, "train_samples_per_second": 1098.03, "train_steps_per_second": 0.429 }