{ "best_metric": 0.8837209302325582, "best_model_checkpoint": "Cvt-finetuned-thyroid/checkpoint-27", "epoch": 30.0, "global_step": 90, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 1.0, "eval_f1": 0.5052631578947367, "eval_loss": 0.687919557094574, "eval_runtime": 0.6589, "eval_samples_per_second": 144.182, "eval_steps_per_second": 4.553, "step": 3 }, { "epoch": 2.0, "eval_f1": 0.673076923076923, "eval_loss": 0.6748365759849548, "eval_runtime": 0.6341, "eval_samples_per_second": 149.822, "eval_steps_per_second": 4.731, "step": 6 }, { "epoch": 3.0, "eval_f1": 0.8034188034188033, "eval_loss": 0.6552020311355591, "eval_runtime": 0.6415, "eval_samples_per_second": 148.089, "eval_steps_per_second": 4.676, "step": 9 }, { "epoch": 4.0, "eval_f1": 0.88, "eval_loss": 0.6357027888298035, "eval_runtime": 0.6465, "eval_samples_per_second": 146.936, "eval_steps_per_second": 4.64, "step": 12 }, { "epoch": 5.0, "eval_f1": 0.8615384615384616, "eval_loss": 0.6192407011985779, "eval_runtime": 0.6387, "eval_samples_per_second": 148.729, "eval_steps_per_second": 4.697, "step": 15 }, { "epoch": 6.0, "eval_f1": 0.8769230769230769, "eval_loss": 0.604374349117279, "eval_runtime": 0.645, "eval_samples_per_second": 147.298, "eval_steps_per_second": 4.652, "step": 18 }, { "epoch": 7.0, "eval_f1": 0.8769230769230769, "eval_loss": 0.5909456014633179, "eval_runtime": 0.6526, "eval_samples_per_second": 145.576, "eval_steps_per_second": 4.597, "step": 21 }, { "epoch": 8.0, "eval_f1": 0.8769230769230769, "eval_loss": 0.5791701674461365, "eval_runtime": 0.6491, "eval_samples_per_second": 146.347, "eval_steps_per_second": 4.621, "step": 24 }, { "epoch": 8.33, "learning_rate": 8.024691358024692e-06, "loss": 0.638, "step": 25 }, { "epoch": 9.0, "eval_f1": 0.8837209302325582, "eval_loss": 0.5682619214057922, "eval_runtime": 0.6497, "eval_samples_per_second": 146.222, "eval_steps_per_second": 4.618, "step": 27 }, { "epoch": 10.0, "eval_f1": 0.8837209302325582, "eval_loss": 0.5576053261756897, "eval_runtime": 0.653, "eval_samples_per_second": 145.478, "eval_steps_per_second": 4.594, "step": 30 }, { "epoch": 11.0, "eval_f1": 0.8837209302325582, "eval_loss": 0.5474461913108826, "eval_runtime": 0.651, "eval_samples_per_second": 145.928, "eval_steps_per_second": 4.608, "step": 33 }, { "epoch": 12.0, "eval_f1": 0.8837209302325582, "eval_loss": 0.5376133322715759, "eval_runtime": 0.6594, "eval_samples_per_second": 144.075, "eval_steps_per_second": 4.55, "step": 36 }, { "epoch": 13.0, "eval_f1": 0.8837209302325582, "eval_loss": 0.5282223224639893, "eval_runtime": 0.6631, "eval_samples_per_second": 143.267, "eval_steps_per_second": 4.524, "step": 39 }, { "epoch": 14.0, "eval_f1": 0.8837209302325582, "eval_loss": 0.5196569561958313, "eval_runtime": 0.6551, "eval_samples_per_second": 145.016, "eval_steps_per_second": 4.579, "step": 42 }, { "epoch": 15.0, "eval_f1": 0.8837209302325582, "eval_loss": 0.5118635296821594, "eval_runtime": 0.6658, "eval_samples_per_second": 142.69, "eval_steps_per_second": 4.506, "step": 45 }, { "epoch": 16.0, "eval_f1": 0.8837209302325582, "eval_loss": 0.5053044557571411, "eval_runtime": 0.6565, "eval_samples_per_second": 144.71, "eval_steps_per_second": 4.57, "step": 48 }, { "epoch": 16.67, "learning_rate": 4.938271604938272e-06, "loss": 0.4926, "step": 50 }, { "epoch": 17.0, "eval_f1": 0.8837209302325582, "eval_loss": 0.49933797121047974, "eval_runtime": 0.6612, "eval_samples_per_second": 143.679, "eval_steps_per_second": 4.537, "step": 51 }, { "epoch": 18.0, "eval_f1": 0.8837209302325582, "eval_loss": 0.4940946102142334, "eval_runtime": 0.661, "eval_samples_per_second": 143.726, "eval_steps_per_second": 4.539, "step": 54 }, { "epoch": 19.0, "eval_f1": 0.8837209302325582, "eval_loss": 0.4895910918712616, "eval_runtime": 0.6623, "eval_samples_per_second": 143.44, "eval_steps_per_second": 4.53, "step": 57 }, { "epoch": 20.0, "eval_f1": 0.8837209302325582, "eval_loss": 0.4853971004486084, "eval_runtime": 0.6837, "eval_samples_per_second": 138.946, "eval_steps_per_second": 4.388, "step": 60 }, { "epoch": 21.0, "eval_f1": 0.8837209302325582, "eval_loss": 0.48188260197639465, "eval_runtime": 0.6669, "eval_samples_per_second": 142.45, "eval_steps_per_second": 4.498, "step": 63 }, { "epoch": 22.0, "eval_f1": 0.8837209302325582, "eval_loss": 0.4790306091308594, "eval_runtime": 0.6675, "eval_samples_per_second": 142.322, "eval_steps_per_second": 4.494, "step": 66 }, { "epoch": 23.0, "eval_f1": 0.8837209302325582, "eval_loss": 0.47673219442367554, "eval_runtime": 0.6755, "eval_samples_per_second": 140.639, "eval_steps_per_second": 4.441, "step": 69 }, { "epoch": 24.0, "eval_f1": 0.8837209302325582, "eval_loss": 0.4748006761074066, "eval_runtime": 0.6675, "eval_samples_per_second": 142.313, "eval_steps_per_second": 4.494, "step": 72 }, { "epoch": 25.0, "learning_rate": 1.8518518518518519e-06, "loss": 0.4289, "step": 75 }, { "epoch": 25.0, "eval_f1": 0.8837209302325582, "eval_loss": 0.4731859564781189, "eval_runtime": 0.6627, "eval_samples_per_second": 143.353, "eval_steps_per_second": 4.527, "step": 75 }, { "epoch": 26.0, "eval_f1": 0.8837209302325582, "eval_loss": 0.4718676507472992, "eval_runtime": 0.6719, "eval_samples_per_second": 141.397, "eval_steps_per_second": 4.465, "step": 78 }, { "epoch": 27.0, "eval_f1": 0.8837209302325582, "eval_loss": 0.4708217680454254, "eval_runtime": 0.68, "eval_samples_per_second": 139.706, "eval_steps_per_second": 4.412, "step": 81 }, { "epoch": 28.0, "eval_f1": 0.8837209302325582, "eval_loss": 0.47011542320251465, "eval_runtime": 0.6739, "eval_samples_per_second": 140.966, "eval_steps_per_second": 4.452, "step": 84 }, { "epoch": 29.0, "eval_f1": 0.8837209302325582, "eval_loss": 0.4697326123714447, "eval_runtime": 0.6728, "eval_samples_per_second": 141.199, "eval_steps_per_second": 4.459, "step": 87 }, { "epoch": 30.0, "eval_f1": 0.8837209302325582, "eval_loss": 0.4695647060871124, "eval_runtime": 0.6801, "eval_samples_per_second": 139.689, "eval_steps_per_second": 4.411, "step": 90 }, { "epoch": 30.0, "step": 90, "total_flos": 2.8570124903878656e+17, "train_loss": 0.5013438595665826, "train_runtime": 222.831, "train_samples_per_second": 51.025, "train_steps_per_second": 0.404 } ], "max_steps": 90, "num_train_epochs": 30, "total_flos": 2.8570124903878656e+17, "trial_name": null, "trial_params": null }