|
{ |
|
"best_metric": 0.19675925925925927, |
|
"best_model_checkpoint": "microsoft-resnet-50-cartoon-face-recognition/checkpoint-24", |
|
"epoch": 19.88888888888889, |
|
"global_step": 120, |
|
"is_hyper_param_search": false, |
|
"is_local_process_zero": true, |
|
"is_world_process_zero": true, |
|
"log_history": [ |
|
{ |
|
"epoch": 0.89, |
|
"eval_accuracy": 0.06712962962962964, |
|
"eval_f1": 0.04268330700511537, |
|
"eval_loss": 3.1718316078186035, |
|
"eval_precision": 0.07750900471648707, |
|
"eval_recall": 0.06712962962962964, |
|
"eval_runtime": 6.9896, |
|
"eval_samples_per_second": 61.806, |
|
"eval_steps_per_second": 1.001, |
|
"step": 6 |
|
}, |
|
{ |
|
"epoch": 1.59, |
|
"learning_rate": 0.0001, |
|
"loss": 3.409, |
|
"step": 10 |
|
}, |
|
{ |
|
"epoch": 1.89, |
|
"eval_accuracy": 0.09722222222222222, |
|
"eval_f1": 0.06941620132016908, |
|
"eval_loss": 3.1434757709503174, |
|
"eval_precision": 0.09483282105538404, |
|
"eval_recall": 0.09722222222222222, |
|
"eval_runtime": 6.3177, |
|
"eval_samples_per_second": 68.379, |
|
"eval_steps_per_second": 1.108, |
|
"step": 12 |
|
}, |
|
{ |
|
"epoch": 2.89, |
|
"eval_accuracy": 0.16666666666666666, |
|
"eval_f1": 0.1157640285514969, |
|
"eval_loss": 3.1100411415100098, |
|
"eval_precision": 0.12231976324858271, |
|
"eval_recall": 0.16666666666666666, |
|
"eval_runtime": 5.8995, |
|
"eval_samples_per_second": 73.226, |
|
"eval_steps_per_second": 1.187, |
|
"step": 18 |
|
}, |
|
{ |
|
"epoch": 3.3, |
|
"learning_rate": 0.00011111111111111112, |
|
"loss": 3.597, |
|
"step": 20 |
|
}, |
|
{ |
|
"epoch": 3.89, |
|
"eval_accuracy": 0.19675925925925927, |
|
"eval_f1": 0.11625378991501253, |
|
"eval_loss": 3.0767667293548584, |
|
"eval_precision": 0.13583887289090224, |
|
"eval_recall": 0.19675925925925927, |
|
"eval_runtime": 5.9054, |
|
"eval_samples_per_second": 73.153, |
|
"eval_steps_per_second": 1.185, |
|
"step": 24 |
|
}, |
|
{ |
|
"epoch": 4.89, |
|
"learning_rate": 0.0001, |
|
"loss": 3.2968, |
|
"step": 30 |
|
}, |
|
{ |
|
"epoch": 4.89, |
|
"eval_accuracy": 0.17592592592592593, |
|
"eval_f1": 0.08794959812293887, |
|
"eval_loss": 3.051513195037842, |
|
"eval_precision": 0.08687890109673733, |
|
"eval_recall": 0.17592592592592593, |
|
"eval_runtime": 5.8218, |
|
"eval_samples_per_second": 74.204, |
|
"eval_steps_per_second": 1.202, |
|
"step": 30 |
|
}, |
|
{ |
|
"epoch": 5.89, |
|
"eval_accuracy": 0.1712962962962963, |
|
"eval_f1": 0.06999759781046332, |
|
"eval_loss": 3.0226213932037354, |
|
"eval_precision": 0.0456331710295125, |
|
"eval_recall": 0.1712962962962963, |
|
"eval_runtime": 5.7818, |
|
"eval_samples_per_second": 74.718, |
|
"eval_steps_per_second": 1.211, |
|
"step": 36 |
|
}, |
|
{ |
|
"epoch": 6.59, |
|
"learning_rate": 8.888888888888888e-05, |
|
"loss": 3.4662, |
|
"step": 40 |
|
}, |
|
{ |
|
"epoch": 6.89, |
|
"eval_accuracy": 0.16666666666666666, |
|
"eval_f1": 0.07065656451437614, |
|
"eval_loss": 2.9997007846832275, |
|
"eval_precision": 0.04987179172442097, |
|
"eval_recall": 0.16666666666666666, |
|
"eval_runtime": 5.8712, |
|
"eval_samples_per_second": 73.579, |
|
"eval_steps_per_second": 1.192, |
|
"step": 42 |
|
}, |
|
{ |
|
"epoch": 7.89, |
|
"eval_accuracy": 0.1550925925925926, |
|
"eval_f1": 0.06279659825962769, |
|
"eval_loss": 2.977167844772339, |
|
"eval_precision": 0.046044346719881876, |
|
"eval_recall": 0.1550925925925926, |
|
"eval_runtime": 5.7878, |
|
"eval_samples_per_second": 74.64, |
|
"eval_steps_per_second": 1.209, |
|
"step": 48 |
|
}, |
|
{ |
|
"epoch": 8.3, |
|
"learning_rate": 7.777777777777778e-05, |
|
"loss": 3.4141, |
|
"step": 50 |
|
}, |
|
{ |
|
"epoch": 8.89, |
|
"eval_accuracy": 0.18518518518518517, |
|
"eval_f1": 0.08918606274115107, |
|
"eval_loss": 2.9533445835113525, |
|
"eval_precision": 0.16404070934618162, |
|
"eval_recall": 0.18518518518518517, |
|
"eval_runtime": 6.9368, |
|
"eval_samples_per_second": 62.277, |
|
"eval_steps_per_second": 1.009, |
|
"step": 54 |
|
}, |
|
{ |
|
"epoch": 9.89, |
|
"learning_rate": 6.666666666666667e-05, |
|
"loss": 3.1376, |
|
"step": 60 |
|
}, |
|
{ |
|
"epoch": 9.89, |
|
"eval_accuracy": 0.16666666666666666, |
|
"eval_f1": 0.07419287680822054, |
|
"eval_loss": 2.931124448776245, |
|
"eval_precision": 0.08951358417023512, |
|
"eval_recall": 0.16666666666666666, |
|
"eval_runtime": 5.8186, |
|
"eval_samples_per_second": 74.244, |
|
"eval_steps_per_second": 1.203, |
|
"step": 60 |
|
}, |
|
{ |
|
"epoch": 10.89, |
|
"eval_accuracy": 0.16435185185185186, |
|
"eval_f1": 0.0724480953675622, |
|
"eval_loss": 2.920067310333252, |
|
"eval_precision": 0.08232943904512993, |
|
"eval_recall": 0.16435185185185186, |
|
"eval_runtime": 5.8821, |
|
"eval_samples_per_second": 73.444, |
|
"eval_steps_per_second": 1.19, |
|
"step": 66 |
|
}, |
|
{ |
|
"epoch": 11.59, |
|
"learning_rate": 5.555555555555556e-05, |
|
"loss": 3.3113, |
|
"step": 70 |
|
}, |
|
{ |
|
"epoch": 11.89, |
|
"eval_accuracy": 0.16435185185185186, |
|
"eval_f1": 0.07315703439667075, |
|
"eval_loss": 2.896663188934326, |
|
"eval_precision": 0.0995273854967043, |
|
"eval_recall": 0.16435185185185186, |
|
"eval_runtime": 5.8475, |
|
"eval_samples_per_second": 73.877, |
|
"eval_steps_per_second": 1.197, |
|
"step": 72 |
|
}, |
|
{ |
|
"epoch": 12.89, |
|
"eval_accuracy": 0.1574074074074074, |
|
"eval_f1": 0.06788189816821627, |
|
"eval_loss": 2.8926467895507812, |
|
"eval_precision": 0.07378815753932359, |
|
"eval_recall": 0.1574074074074074, |
|
"eval_runtime": 6.731, |
|
"eval_samples_per_second": 64.181, |
|
"eval_steps_per_second": 1.04, |
|
"step": 78 |
|
}, |
|
{ |
|
"epoch": 13.3, |
|
"learning_rate": 4.444444444444444e-05, |
|
"loss": 3.2872, |
|
"step": 80 |
|
}, |
|
{ |
|
"epoch": 13.89, |
|
"eval_accuracy": 0.1712962962962963, |
|
"eval_f1": 0.07606979068720418, |
|
"eval_loss": 2.8844218254089355, |
|
"eval_precision": 0.0804587704274602, |
|
"eval_recall": 0.1712962962962963, |
|
"eval_runtime": 5.7658, |
|
"eval_samples_per_second": 74.924, |
|
"eval_steps_per_second": 1.214, |
|
"step": 84 |
|
}, |
|
{ |
|
"epoch": 14.89, |
|
"learning_rate": 3.3333333333333335e-05, |
|
"loss": 3.0305, |
|
"step": 90 |
|
}, |
|
{ |
|
"epoch": 14.89, |
|
"eval_accuracy": 0.1712962962962963, |
|
"eval_f1": 0.07456109408196694, |
|
"eval_loss": 2.8605401515960693, |
|
"eval_precision": 0.09364712421465295, |
|
"eval_recall": 0.1712962962962963, |
|
"eval_runtime": 5.8764, |
|
"eval_samples_per_second": 73.515, |
|
"eval_steps_per_second": 1.191, |
|
"step": 90 |
|
}, |
|
{ |
|
"epoch": 15.89, |
|
"eval_accuracy": 0.17592592592592593, |
|
"eval_f1": 0.077154753687655, |
|
"eval_loss": 2.8563218116760254, |
|
"eval_precision": 0.09599160283239885, |
|
"eval_recall": 0.17592592592592593, |
|
"eval_runtime": 5.8036, |
|
"eval_samples_per_second": 74.436, |
|
"eval_steps_per_second": 1.206, |
|
"step": 96 |
|
}, |
|
{ |
|
"epoch": 16.59, |
|
"learning_rate": 2.222222222222222e-05, |
|
"loss": 3.2263, |
|
"step": 100 |
|
}, |
|
{ |
|
"epoch": 16.89, |
|
"eval_accuracy": 0.1712962962962963, |
|
"eval_f1": 0.07532319701759846, |
|
"eval_loss": 2.8487489223480225, |
|
"eval_precision": 0.10121344883941782, |
|
"eval_recall": 0.1712962962962963, |
|
"eval_runtime": 5.766, |
|
"eval_samples_per_second": 74.921, |
|
"eval_steps_per_second": 1.214, |
|
"step": 102 |
|
}, |
|
{ |
|
"epoch": 17.89, |
|
"eval_accuracy": 0.1712962962962963, |
|
"eval_f1": 0.07721457778893034, |
|
"eval_loss": 2.8424181938171387, |
|
"eval_precision": 0.12103390482470601, |
|
"eval_recall": 0.1712962962962963, |
|
"eval_runtime": 5.8577, |
|
"eval_samples_per_second": 73.749, |
|
"eval_steps_per_second": 1.195, |
|
"step": 108 |
|
}, |
|
{ |
|
"epoch": 18.3, |
|
"learning_rate": 1.111111111111111e-05, |
|
"loss": 3.1927, |
|
"step": 110 |
|
}, |
|
{ |
|
"epoch": 18.89, |
|
"eval_accuracy": 0.1736111111111111, |
|
"eval_f1": 0.07100199262795664, |
|
"eval_loss": 2.837003707885742, |
|
"eval_precision": 0.05610008615248136, |
|
"eval_recall": 0.1736111111111111, |
|
"eval_runtime": 5.7707, |
|
"eval_samples_per_second": 74.861, |
|
"eval_steps_per_second": 1.213, |
|
"step": 114 |
|
}, |
|
{ |
|
"epoch": 19.89, |
|
"learning_rate": 0.0, |
|
"loss": 2.992, |
|
"step": 120 |
|
}, |
|
{ |
|
"epoch": 19.89, |
|
"eval_accuracy": 0.18055555555555555, |
|
"eval_f1": 0.08808104613908821, |
|
"eval_loss": 2.849083423614502, |
|
"eval_precision": 0.15482731189307494, |
|
"eval_recall": 0.18055555555555555, |
|
"eval_runtime": 5.8109, |
|
"eval_samples_per_second": 74.343, |
|
"eval_steps_per_second": 1.205, |
|
"step": 120 |
|
}, |
|
{ |
|
"epoch": 19.89, |
|
"step": 120, |
|
"total_flos": 7.312175696361554e+17, |
|
"train_loss": 3.2800607363382976, |
|
"train_runtime": 455.8097, |
|
"train_samples_per_second": 75.821, |
|
"train_steps_per_second": 0.263 |
|
} |
|
], |
|
"max_steps": 120, |
|
"num_train_epochs": 20, |
|
"total_flos": 7.312175696361554e+17, |
|
"trial_name": null, |
|
"trial_params": null |
|
} |
|
|