ThyroidTumorClassificationModel / trainer_state.json
SerdarHelli's picture
ThyroidTumorClassification
15de256
raw
history blame
8.08 kB
{
"best_metric": 0.8837209302325582,
"best_model_checkpoint": "Cvt-finetuned-thyroid/checkpoint-27",
"epoch": 30.0,
"global_step": 90,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 1.0,
"eval_f1": 0.5052631578947367,
"eval_loss": 0.687919557094574,
"eval_runtime": 0.6589,
"eval_samples_per_second": 144.182,
"eval_steps_per_second": 4.553,
"step": 3
},
{
"epoch": 2.0,
"eval_f1": 0.673076923076923,
"eval_loss": 0.6748365759849548,
"eval_runtime": 0.6341,
"eval_samples_per_second": 149.822,
"eval_steps_per_second": 4.731,
"step": 6
},
{
"epoch": 3.0,
"eval_f1": 0.8034188034188033,
"eval_loss": 0.6552020311355591,
"eval_runtime": 0.6415,
"eval_samples_per_second": 148.089,
"eval_steps_per_second": 4.676,
"step": 9
},
{
"epoch": 4.0,
"eval_f1": 0.88,
"eval_loss": 0.6357027888298035,
"eval_runtime": 0.6465,
"eval_samples_per_second": 146.936,
"eval_steps_per_second": 4.64,
"step": 12
},
{
"epoch": 5.0,
"eval_f1": 0.8615384615384616,
"eval_loss": 0.6192407011985779,
"eval_runtime": 0.6387,
"eval_samples_per_second": 148.729,
"eval_steps_per_second": 4.697,
"step": 15
},
{
"epoch": 6.0,
"eval_f1": 0.8769230769230769,
"eval_loss": 0.604374349117279,
"eval_runtime": 0.645,
"eval_samples_per_second": 147.298,
"eval_steps_per_second": 4.652,
"step": 18
},
{
"epoch": 7.0,
"eval_f1": 0.8769230769230769,
"eval_loss": 0.5909456014633179,
"eval_runtime": 0.6526,
"eval_samples_per_second": 145.576,
"eval_steps_per_second": 4.597,
"step": 21
},
{
"epoch": 8.0,
"eval_f1": 0.8769230769230769,
"eval_loss": 0.5791701674461365,
"eval_runtime": 0.6491,
"eval_samples_per_second": 146.347,
"eval_steps_per_second": 4.621,
"step": 24
},
{
"epoch": 8.33,
"learning_rate": 8.024691358024692e-06,
"loss": 0.638,
"step": 25
},
{
"epoch": 9.0,
"eval_f1": 0.8837209302325582,
"eval_loss": 0.5682619214057922,
"eval_runtime": 0.6497,
"eval_samples_per_second": 146.222,
"eval_steps_per_second": 4.618,
"step": 27
},
{
"epoch": 10.0,
"eval_f1": 0.8837209302325582,
"eval_loss": 0.5576053261756897,
"eval_runtime": 0.653,
"eval_samples_per_second": 145.478,
"eval_steps_per_second": 4.594,
"step": 30
},
{
"epoch": 11.0,
"eval_f1": 0.8837209302325582,
"eval_loss": 0.5474461913108826,
"eval_runtime": 0.651,
"eval_samples_per_second": 145.928,
"eval_steps_per_second": 4.608,
"step": 33
},
{
"epoch": 12.0,
"eval_f1": 0.8837209302325582,
"eval_loss": 0.5376133322715759,
"eval_runtime": 0.6594,
"eval_samples_per_second": 144.075,
"eval_steps_per_second": 4.55,
"step": 36
},
{
"epoch": 13.0,
"eval_f1": 0.8837209302325582,
"eval_loss": 0.5282223224639893,
"eval_runtime": 0.6631,
"eval_samples_per_second": 143.267,
"eval_steps_per_second": 4.524,
"step": 39
},
{
"epoch": 14.0,
"eval_f1": 0.8837209302325582,
"eval_loss": 0.5196569561958313,
"eval_runtime": 0.6551,
"eval_samples_per_second": 145.016,
"eval_steps_per_second": 4.579,
"step": 42
},
{
"epoch": 15.0,
"eval_f1": 0.8837209302325582,
"eval_loss": 0.5118635296821594,
"eval_runtime": 0.6658,
"eval_samples_per_second": 142.69,
"eval_steps_per_second": 4.506,
"step": 45
},
{
"epoch": 16.0,
"eval_f1": 0.8837209302325582,
"eval_loss": 0.5053044557571411,
"eval_runtime": 0.6565,
"eval_samples_per_second": 144.71,
"eval_steps_per_second": 4.57,
"step": 48
},
{
"epoch": 16.67,
"learning_rate": 4.938271604938272e-06,
"loss": 0.4926,
"step": 50
},
{
"epoch": 17.0,
"eval_f1": 0.8837209302325582,
"eval_loss": 0.49933797121047974,
"eval_runtime": 0.6612,
"eval_samples_per_second": 143.679,
"eval_steps_per_second": 4.537,
"step": 51
},
{
"epoch": 18.0,
"eval_f1": 0.8837209302325582,
"eval_loss": 0.4940946102142334,
"eval_runtime": 0.661,
"eval_samples_per_second": 143.726,
"eval_steps_per_second": 4.539,
"step": 54
},
{
"epoch": 19.0,
"eval_f1": 0.8837209302325582,
"eval_loss": 0.4895910918712616,
"eval_runtime": 0.6623,
"eval_samples_per_second": 143.44,
"eval_steps_per_second": 4.53,
"step": 57
},
{
"epoch": 20.0,
"eval_f1": 0.8837209302325582,
"eval_loss": 0.4853971004486084,
"eval_runtime": 0.6837,
"eval_samples_per_second": 138.946,
"eval_steps_per_second": 4.388,
"step": 60
},
{
"epoch": 21.0,
"eval_f1": 0.8837209302325582,
"eval_loss": 0.48188260197639465,
"eval_runtime": 0.6669,
"eval_samples_per_second": 142.45,
"eval_steps_per_second": 4.498,
"step": 63
},
{
"epoch": 22.0,
"eval_f1": 0.8837209302325582,
"eval_loss": 0.4790306091308594,
"eval_runtime": 0.6675,
"eval_samples_per_second": 142.322,
"eval_steps_per_second": 4.494,
"step": 66
},
{
"epoch": 23.0,
"eval_f1": 0.8837209302325582,
"eval_loss": 0.47673219442367554,
"eval_runtime": 0.6755,
"eval_samples_per_second": 140.639,
"eval_steps_per_second": 4.441,
"step": 69
},
{
"epoch": 24.0,
"eval_f1": 0.8837209302325582,
"eval_loss": 0.4748006761074066,
"eval_runtime": 0.6675,
"eval_samples_per_second": 142.313,
"eval_steps_per_second": 4.494,
"step": 72
},
{
"epoch": 25.0,
"learning_rate": 1.8518518518518519e-06,
"loss": 0.4289,
"step": 75
},
{
"epoch": 25.0,
"eval_f1": 0.8837209302325582,
"eval_loss": 0.4731859564781189,
"eval_runtime": 0.6627,
"eval_samples_per_second": 143.353,
"eval_steps_per_second": 4.527,
"step": 75
},
{
"epoch": 26.0,
"eval_f1": 0.8837209302325582,
"eval_loss": 0.4718676507472992,
"eval_runtime": 0.6719,
"eval_samples_per_second": 141.397,
"eval_steps_per_second": 4.465,
"step": 78
},
{
"epoch": 27.0,
"eval_f1": 0.8837209302325582,
"eval_loss": 0.4708217680454254,
"eval_runtime": 0.68,
"eval_samples_per_second": 139.706,
"eval_steps_per_second": 4.412,
"step": 81
},
{
"epoch": 28.0,
"eval_f1": 0.8837209302325582,
"eval_loss": 0.47011542320251465,
"eval_runtime": 0.6739,
"eval_samples_per_second": 140.966,
"eval_steps_per_second": 4.452,
"step": 84
},
{
"epoch": 29.0,
"eval_f1": 0.8837209302325582,
"eval_loss": 0.4697326123714447,
"eval_runtime": 0.6728,
"eval_samples_per_second": 141.199,
"eval_steps_per_second": 4.459,
"step": 87
},
{
"epoch": 30.0,
"eval_f1": 0.8837209302325582,
"eval_loss": 0.4695647060871124,
"eval_runtime": 0.6801,
"eval_samples_per_second": 139.689,
"eval_steps_per_second": 4.411,
"step": 90
},
{
"epoch": 30.0,
"step": 90,
"total_flos": 2.8570124903878656e+17,
"train_loss": 0.5013438595665826,
"train_runtime": 222.831,
"train_samples_per_second": 51.025,
"train_steps_per_second": 0.404
}
],
"max_steps": 90,
"num_train_epochs": 30,
"total_flos": 2.8570124903878656e+17,
"trial_name": null,
"trial_params": null
}