epoch = 11.55 train_loss = 2.541904963623047 train_runtime = 186540.8186 train_samples_per_second = 686.177 train_steps_per_second = 2.68